{ "caption_matching": { "1034419625": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is dribbling a basketball.\nOption 2: A man is dunking a basketball.", "gt-answer": "Option 2: A man is dunking a basketball.", "video-llm-prediction": "Option 2: A man is dunking a basketball.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A man is dunking a basketball.\nSentence B: A video showing a person passing a basketball.", "gt-answer": "Sentence A: A man is dunking a basketball.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A man is dunking a basketball.\nCaption B: The man is shooting a basketball.", "gt-answer": "Caption A: A man is dunking a basketball.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is moving from left to right.\nSentence B: The man is moving from right to left.", "gt-answer": "Sentence A: The man is moving from left to right.", "video-llm-prediction": "Sentence B: The man is moving from right to left.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: From the camera's point of view, the man is moving from right to left.\nOption 2: The man is moving from left to right.", "gt-answer": "Option 2: The man is moving from left to right.", "video-llm-prediction": "Option 1: From the camera's point of view, the man is moving from right to left.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The man is moving from right to left.\nCaption B: The man is moving from left to right.", "gt-answer": "Caption B: The man is moving from left to right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1034419625_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is moving from left to right.\nSentence B: The man is moving from right to left.", "gt-answer": "Sentence B: The man is moving from right to left.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: From the camera's point of view, the man is moving from right to left.\nOption 2: The man is moving from left to right.", "gt-answer": "Option 1: From the camera's point of view, the man is moving from right to left.", "video-llm-prediction": "Option 1: From the camera's point of view, the man is moving from right to left.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is moving from right to left.\nCaption B: The man is moving from left to right.", "gt-answer": "Caption A: The man is moving from right to left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1094590221": { "action": [ { "question": "Which caption matches the video better?\nCaption A: A man is shooting basketball in the video.\nCaption B: A man is dunking basketball in the video.", "gt-answer": "Caption A: A man is shooting basketball in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is spinning basketball.\nSentence B: A man is shooting basketball in the video.", "gt-answer": "Sentence B: A man is shooting basketball in the video.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A man is shooting basketball in the video.\nOption 2: A person is dribbling basketball in the video.", "gt-answer": "Option 1: A man is shooting basketball in the video.", "video-llm-prediction": "Option 1: A man is shooting basketball in the video.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The basketball is moving from right to left.\nSentence B: The basketball is moving from left to right.", "gt-answer": "Sentence A: The basketball is moving from right to left.", "video-llm-prediction": "Sentence B: The basketball is moving from left to right.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The basketball is moving from right to left.\nOption 2: The basketball is moving from left to right.", "gt-answer": "Option 1: The basketball is moving from right to left.", "video-llm-prediction": "Option 2: The basketball is moving from left to right.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The basketball is moving from right to left.\nCaption B: The basketball is moving from left to right.", "gt-answer": "Caption A: The basketball is moving from right to left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1094590221_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The basketball is moving from right to left.\nSentence B: The basketball is moving from left to right.", "gt-answer": "Sentence B: The basketball is moving from left to right.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The basketball is moving from right to left.\nOption 2: The basketball is moving from left to right.", "gt-answer": "Option 2: The basketball is moving from left to right.", "video-llm-prediction": "Option 1: The basketball is moving from right to left.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The basketball is moving from right to left.\nCaption B: The basketball is moving from left to right.", "gt-answer": "Caption B: The basketball is moving from left to right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1098982673": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is eating and singing.\nOption 2: The woman is dancing and singing.", "gt-answer": "Option 2: The woman is dancing and singing.", "video-llm-prediction": "Option 2: The woman is dancing and singing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is sleeping and singing.\nCaption B: The woman is dancing and singing.", "gt-answer": "Caption B: The woman is dancing and singing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is running and singing.\nSentence B: The woman is dancing and singing.", "gt-answer": "Sentence B: The woman is dancing and singing.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at normal speed.\nSentence B: The video is playing in slow motion.", "gt-answer": "Sentence A: The video is playing at normal speed.", "video-llm-prediction": "Sentence B: The video is playing in slow motion.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is fast forwarded.\nCaption B: The video is playing at normal speed.", "gt-answer": "Caption B: The video is playing at normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at normal speed.\nOption 2: The video is being played in reverse.", "gt-answer": "Option 1: The video is playing at normal speed.", "video-llm-prediction": "Option 1: The video is playing at normal speed.", "match_success": true, "rating": 1 } ] }, "1111657885": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The people are skiing.\nSentence B: The people are ice skating.", "gt-answer": "Sentence B: The people are ice skating.", "video-llm-prediction": "Sentence B: The people are ice skating.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The people are ice skating.\nCaption B: The people are swimming.", "gt-answer": "Caption A: The people are ice skating.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people are ice skating.\nOption 2: A sport being played by the people is tennis.", "gt-answer": "Option 1: The people are ice skating.", "video-llm-prediction": "Option 1: The people are ice skating.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which caption matches the video better?\nCaption A: The video is presented at a rapid pace.\nCaption B: The video has a slow motion tempo.", "gt-answer": "Caption B: The video has a slow motion tempo.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The entire video is in normal speed.\nOption 2: The video has a slow motion tempo.", "gt-answer": "Option 2: The video has a slow motion tempo.", "video-llm-prediction": "Option 2: The video has a slow motion tempo.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is paused.\nSentence B: The video has a slow motion tempo.", "gt-answer": "Sentence B: The video has a slow motion tempo.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The people are parallel to the screen.\nCaption B: The people are skating towards the camera.", "gt-answer": "Caption B: The people are skating towards the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people are skating away from the camera.\nOption 2: The people are skating towards the camera.", "gt-answer": "Option 2: The people are skating towards the camera.", "video-llm-prediction": "Option 2: The people are skating towards the camera.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The people are skating away from the camera.\nSentence B: The people are skating towards the camera.", "gt-answer": "Sentence B: The people are skating towards the camera.", "video-llm-prediction": "Sentence A: The people are skating away from the camera.", "match_success": true, "rating": 0 } ] }, "1111657885_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The people are parallel to the screen.\nCaption B: The people are skating towards the camera.", "gt-answer": "Caption A: The people are parallel to the screen.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people are skating away from the camera.\nOption 2: The people are skating towards the camera.", "gt-answer": "Option 1: The people are skating away from the camera.", "video-llm-prediction": "Option 2: The people are skating towards the camera.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The people are skating away from the camera.\nSentence B: The people are skating towards the camera.", "gt-answer": "Sentence A: The people are skating away from the camera.", "video-llm-prediction": "Sentence B: The people are skating towards the camera.", "match_success": true, "rating": 0 } ] }, "1073873933": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A video is showing a fight.\nOption 2: A person is eating.", "gt-answer": "Option 1: A video is showing a fight.", "video-llm-prediction": "Option 1: A video is showing a fight.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A video is showing a fight.\nCaption B: The monkey is swimming.", "gt-answer": "Caption A: A video is showing a fight.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A video is showing a fight.\nSentence B: Someone is running.", "gt-answer": "Sentence A: A video is showing a fight.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1089810425": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The people are dancing.\nSentence B: The people are cooking.", "gt-answer": "Sentence A: The people are dancing.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The people are dancing.\nCaption B: A video showing people sleeping.", "gt-answer": "Caption A: The people are dancing.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people are painting.\nOption 2: The people are dancing.", "gt-answer": "Option 2: The people are dancing.", "video-llm-prediction": "Option 2: The people are dancing.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the video is normal.\nSentence B: The video is in slow motion.", "gt-answer": "Sentence A: The speed of the video is normal.", "video-llm-prediction": "Sentence B: The video is in slow motion.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is in time-lapse.\nOption 2: The speed of the video is normal.", "gt-answer": "Option 2: The speed of the video is normal.", "video-llm-prediction": "Option 1: The video is in time-lapse.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the video is normal.\nCaption B: The tempo of the entire video is fast.", "gt-answer": "Caption A: The speed of the video is normal.", "video-llm-prediction": "Caption B: The tempo of the entire video is fast.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The video is panning from left to right.\nCaption B: The video is panning from right to left.", "gt-answer": "Caption B: The video is panning from right to left.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The panning in the video is from left to right.\nSentence B: The panning in the video is from right to left.", "gt-answer": "Sentence B: The panning in the video is from right to left.", "video-llm-prediction": "Sentence B: The panning in the video is from right to left.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The panning in the video is from left to right.\nOption 2: The panning in the video is from right to left.", "gt-answer": "Option 2: The panning in the video is from right to left.", "video-llm-prediction": "Option 2: The panning in the video is from right to left.", "match_success": true, "rating": 1 } ] }, "1089810425_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The video is panning from left to right.\nCaption B: The video is panning from right to left.", "gt-answer": "Caption A: The video is panning from left to right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The panning in the video is from left to right.\nSentence B: The panning in the video is from right to left.", "gt-answer": "Sentence A: The panning in the video is from left to right.", "video-llm-prediction": "Sentence B: The panning in the video is from right to left.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The panning in the video is from left to right.\nOption 2: The panning in the video is from right to left.", "gt-answer": "Option 1: The panning in the video is from left to right.", "video-llm-prediction": "Option 2: The panning in the video is from right to left.", "match_success": true, "rating": 0 } ] }, "1077507593": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The people in the video are cooking.\nSentence B: The people in the video are sleeping.", "gt-answer": "Sentence A: The people in the video are cooking.", "video-llm-prediction": "Sentence A: The people in the video are cooking.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The people in the video are cooking.\nCaption B: A person is eating in the video.", "gt-answer": "Caption A: The people in the video are cooking.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people in the video are cooking.\nOption 2: There is dancing happening in the video.", "gt-answer": "Option 1: The people in the video are cooking.", "video-llm-prediction": "Option 1: The people in the video are cooking.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is in slow motion.\nSentence B: The video is at normal speed.", "gt-answer": "Sentence A: The video is in slow motion.", "video-llm-prediction": "Sentence A: The video is in slow motion.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is in slow motion.\nCaption B: The video is in time-lapse.", "gt-answer": "Caption A: The video is in slow motion.", "video-llm-prediction": "Caption A: The video is in slow motion.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is in slow motion.\nOption 2: The events in the video are happening at a fast rate.", "gt-answer": "Option 1: The video is in slow motion.", "video-llm-prediction": "Option 1: The video is in slow motion.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The skillet is smoking, and then it is burning in fire.\nSentence B: The skillet is burning in fire, and then it is smoking.", "gt-answer": "Sentence A: The skillet is smoking, and then it is burning in fire.", "video-llm-prediction": "Sentence A: The skillet is smoking, and then it is burning in fire.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The skillet is smoking after burning in fire.\nOption 2: The skillet is smoking, and then it is burning in fire.", "gt-answer": "Option 2: The skillet is smoking, and then it is burning in fire.", "video-llm-prediction": "Option 1: The skillet is smoking after burning in fire.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The skillet is neither smoking nor burning.\nCaption B: The skillet is smoking, and then it is burning in fire.", "gt-answer": "Caption B: The skillet is smoking, and then it is burning in fire.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1107116885": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is swimming.\nOption 2: The man is shooting an arrow.", "gt-answer": "Option 2: The man is shooting an arrow.", "video-llm-prediction": "Option 2: The man is shooting an arrow.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A person is running.\nCaption B: The man is shooting an arrow.", "gt-answer": "Caption B: The man is shooting an arrow.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: He is playing soccer.\nSentence B: The man is shooting an arrow.", "gt-answer": "Sentence B: The man is shooting an arrow.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing with time-lapse effect.\nOption 2: The video is playing at a normal speed.", "gt-answer": "Option 2: The video is playing at a normal speed.", "video-llm-prediction": "Option 1: The video is playing with time-lapse effect.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The pace of the video is slow motion.\nCaption B: The video is playing at a normal speed.", "gt-answer": "Caption B: The video is playing at a normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at a normal speed.\nSentence B: The video is playing at a rapid speed.", "gt-answer": "Sentence A: The video is playing at a normal speed.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1059718130": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The video is playing in time-lapse.\nCaption B: The speed of the video is slow motion.", "gt-answer": "Caption A: The video is playing in time-lapse.", "video-llm-prediction": "Caption A: The video is playing in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing in stop motion.\nSentence B: The video is playing in time-lapse.", "gt-answer": "Sentence B: The video is playing in time-lapse.", "video-llm-prediction": "Sentence B: The video is playing in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing in time-lapse.\nOption 2: The pace at which the video is playing is fast-forward.", "gt-answer": "Option 1: The video is playing in time-lapse.", "video-llm-prediction": "Option 1: The video is playing in time-lapse.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun is rising.\nSentence B: The sun is setting.", "gt-answer": "Sentence A: The sun is rising.", "video-llm-prediction": "Sentence B: The sun is setting.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The sun is falling.\nCaption B: The sun is rising.", "gt-answer": "Caption B: The sun is rising.", "video-llm-prediction": "Caption B: The sun is rising.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun is moving downwards.\nOption 2: The sun is moving upwards.", "gt-answer": "Option 2: The sun is moving upwards.", "video-llm-prediction": "Option 1: The sun is moving downwards.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The video's brightness is turning brighter.\nCaption B: The video's brightness is getting darker.", "gt-answer": "Caption A: The video's brightness is turning brighter.", "video-llm-prediction": "Caption A: The video's brightness is turning brighter.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video's brightness is turning brighter.\nSentence B: The attribute of brightness is remaining stable.", "gt-answer": "Sentence A: The video's brightness is turning brighter.", "video-llm-prediction": "Sentence A: The video's brightness is turning brighter.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video's brightness is turning brighter.\nOption 2: The brightness is decreasing.", "gt-answer": "Option 1: The video's brightness is turning brighter.", "video-llm-prediction": "Option 1: The video's brightness is turning brighter.", "match_success": true, "rating": 1 } ] }, "1059718130_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun is rising.\nSentence B: The sun is setting.", "gt-answer": "Sentence B: The sun is setting.", "video-llm-prediction": "Sentence B: The sun is setting.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The sun is falling.\nCaption B: The sun is rising.", "gt-answer": "Caption A: The sun is falling.", "video-llm-prediction": "Caption B: The sun is rising.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun is moving downwards.\nOption 2: The sun is moving upwards.", "gt-answer": "Option 1: The sun is moving downwards.", "video-llm-prediction": "Option 1: The sun is moving downwards.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The video's brightness is turning brighter.\nCaption B: The video's brightness is getting darker.", "gt-answer": "Caption B: The video's brightness is getting darker.", "video-llm-prediction": "Caption B: The video's brightness is getting darker.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video's brightness is turning brighter.\nSentence B: The attribute of brightness is remaining stable.", "gt-answer": "Sentence B: The attribute of brightness is remaining stable.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video's brightness is turning brighter.\nOption 2: The brightness is decreasing.", "gt-answer": "Option 2: The brightness is decreasing.", "video-llm-prediction": "Option 2: The brightness is decreasing.", "match_success": true, "rating": 1 } ] }, "1083845854": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at time-lapse speed.\nSentence B: The video is playing at slow motion speed.", "gt-answer": "Sentence A: The video is playing at time-lapse speed.", "video-llm-prediction": "Sentence A: The video is playing at time-lapse speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing at normal speed.\nCaption B: The video is playing at time-lapse speed.", "gt-answer": "Caption B: The video is playing at time-lapse speed.", "video-llm-prediction": "Caption B: The video is playing at time-lapse speed.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at time-lapse speed.\nOption 2: The video is playing in fast-forward mode.", "gt-answer": "Option 1: The video is playing at time-lapse speed.", "video-llm-prediction": "Option 1: The video is playing at time-lapse speed.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The clock hands are moving clockwise.\nOption 2: The clock hands are moving counterclockwise.", "gt-answer": "Option 1: The clock hands are moving clockwise.", "video-llm-prediction": "Option 1: The clock hands are moving clockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The clock hands are moving counterclockwise.\nSentence B: The clock hands are moving clockwise.", "gt-answer": "Sentence B: The clock hands are moving clockwise.", "video-llm-prediction": "Sentence A: The clock hands are moving counterclockwise.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The clock hands are rotating counterclockwise.\nCaption B: The clock hands are rotating clockwise.", "gt-answer": "Caption B: The clock hands are rotating clockwise.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1050618460": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the entire video is normal speed.\nSentence B: The speed of the entire video is time-lapse.", "gt-answer": "Sentence B: The speed of the entire video is time-lapse.", "video-llm-prediction": "Sentence B: The speed of the entire video is time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the entire video is slow motion.\nCaption B: The speed of the entire video is time-lapse.", "gt-answer": "Caption B: The speed of the entire video is time-lapse.", "video-llm-prediction": "Caption B: The speed of the entire video is time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the entire video is time-lapse.\nOption 2: The pace of the entire video is slow-paced.", "gt-answer": "Option 1: The speed of the entire video is time-lapse.", "video-llm-prediction": "Option 1: The speed of the entire video is time-lapse.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The flowers are withering.\nSentence B: The flowers are turning into full bloom.", "gt-answer": "Sentence B: The flowers are turning into full bloom.", "video-llm-prediction": "Sentence B: The flowers are turning into full bloom.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The flowers are turning into full bloom.\nCaption B: The flowers are shrinking and wilting.", "gt-answer": "Caption A: The flowers are turning into full bloom.", "video-llm-prediction": "Caption A: The flowers are turning into full bloom.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The flowers are turning into full bloom.\nOption 2: The flowers are turning into buds.", "gt-answer": "Option 1: The flowers are turning into full bloom.", "video-llm-prediction": "Option 1: The flowers are turning into full bloom.", "match_success": true, "rating": 1 } ] }, "1083113449": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the video is time-lapse.\nOption 2: The speed of the video is slow motion.", "gt-answer": "Option 1: The speed of the video is time-lapse.", "video-llm-prediction": "Option 1: The speed of the video is time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the video is time-lapse.\nSentence B: The video is in normal speed.", "gt-answer": "Sentence A: The speed of the video is time-lapse.", "video-llm-prediction": "Sentence A: The speed of the video is time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the video is rewind.\nCaption B: The speed of the video is time-lapse.", "gt-answer": "Caption B: The speed of the video is time-lapse.", "video-llm-prediction": "Caption B: The speed of the video is time-lapse.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The sky is maintaining its brightness.\nCaption B: The sky is getting darker.", "gt-answer": "Caption B: The sky is getting darker.", "video-llm-prediction": "Caption B: The sky is getting darker.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sky is lightening up.\nOption 2: The sky is getting darker.", "gt-answer": "Option 2: The sky is getting darker.", "video-llm-prediction": "Option 2: The sky is getting darker.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sky is getting darker.\nSentence B: The sky is brightening.", "gt-answer": "Sentence A: The sky is getting darker.", "video-llm-prediction": "Sentence A: The sky is getting darker.", "match_success": true, "rating": 1 } ] }, "1091143117": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is in normal speed.\nOption 2: The video is in time-lapse.", "gt-answer": "Option 1: The video is in normal speed.", "video-llm-prediction": "Option 1: The video is in normal speed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is in slow motion.\nSentence B: The video is in normal speed.", "gt-answer": "Sentence B: The video is in normal speed.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is in normal speed.\nCaption B: The video is moving backwards.", "gt-answer": "Caption A: The video is in normal speed.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The eye is changing from closed to open.\nOption 2: The eye is blinking rapidly.", "gt-answer": "Option 1: The eye is changing from closed to open.", "video-llm-prediction": "Option 1: The eye is changing from closed to open.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The eye is changing from closed to open.\nCaption B: The eye is changing from open to closed.", "gt-answer": "Caption A: The eye is changing from closed to open.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The eye is changing from closed to open.\nSentence B: The eye is changing from open to closed.", "gt-answer": "Sentence A: The eye is changing from closed to open.", "video-llm-prediction": "Sentence A: The eye is changing from closed to open.", "match_success": true, "rating": 1 } ] }, "1100329207": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The sheep is sleeping.\nCaption B: A sheep is running.", "gt-answer": "Caption B: A sheep is running.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sheep is eating grass.\nSentence B: A sheep is running.", "gt-answer": "Sentence B: A sheep is running.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A sheep is running.\nOption 2: The sheep is swimming.", "gt-answer": "Option 1: A sheep is running.", "video-llm-prediction": "Option 1: A sheep is running.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The camera view is moving right.\nOption 2: The camera view is moving forward.", "gt-answer": "Option 2: The camera view is moving forward.", "video-llm-prediction": "Option 2: The camera view is moving forward.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The camera view is moving forward.\nCaption B: The camera view is moving backward.", "gt-answer": "Caption A: The camera view is moving forward.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera view is moving forward.\nSentence B: The camera view is moving left.", "gt-answer": "Sentence A: The camera view is moving forward.", "video-llm-prediction": "Sentence A: The camera view is moving forward.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at normal speed.\nOption 2: The video is fast-forwarded.", "gt-answer": "Option 1: The video is playing at normal speed.", "video-llm-prediction": "Option 1: The video is playing at normal speed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at normal speed.\nSentence B: The video is playing in reverse speed.", "gt-answer": "Sentence A: The video is playing at normal speed.", "video-llm-prediction": "Sentence A: The video is playing at normal speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is in super slow motion.\nCaption B: The video is playing at normal speed.", "gt-answer": "Caption B: The video is playing at normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1089201973": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The people in the video are spinning football.\nOption 2: The people in the video are kicking a football.", "gt-answer": "Option 2: The people in the video are kicking a football.", "video-llm-prediction": "Option 2: The people in the video are kicking a football.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The people in the video are kicking a football.\nSentence B: The people in the video are stopping football.", "gt-answer": "Sentence A: The people in the video are kicking a football.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The people in the video are throwing football.\nCaption B: The people in the video are kicking a football.", "gt-answer": "Caption B: The people in the video are kicking a football.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at normal speed.\nSentence B: The video is playing in slow motion.", "gt-answer": "Sentence B: The video is playing in slow motion.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is time-lapse.\nCaption B: The video is playing in slow motion.", "gt-answer": "Caption B: The video is playing in slow motion.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing in rapid speed.\nOption 2: The video is playing in slow motion.", "gt-answer": "Option 2: The video is playing in slow motion.", "video-llm-prediction": "Option 2: The video is playing in slow motion.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The football is moving from right to left.\nOption 2: The football is moving from left to right in the video.", "gt-answer": "Option 2: The football is moving from left to right in the video.", "video-llm-prediction": "Option 2: The football is moving from left to right in the video.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The football is moving from left to right in the video.\nSentence B: The football is moving from right to left in the video.", "gt-answer": "Sentence A: The football is moving from left to right in the video.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The football is moving upwards.\nCaption B: The football is moving from left to right in the video.", "gt-answer": "Caption B: The football is moving from left to right in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1034736653": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman athletes are running.\nSentence B: The woman athletes are cycling.", "gt-answer": "Sentence A: The woman athletes are running.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman athletes are running.\nOption 2: The woman athletes are swimming.", "gt-answer": "Option 1: The woman athletes are running.", "video-llm-prediction": "Option 1: The woman athletes are running.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman athletes are running.\nCaption B: The woman athletes are dancing.", "gt-answer": "Caption A: The woman athletes are running.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman closest to the camera is moving at a normal speed.\nSentence B: The woman closest to the camera is moving at the fastest speed.", "gt-answer": "Sentence B: The woman closest to the camera is moving at the fastest speed.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Compared to others, the woman closest to the camera is moving at the same speed.\nCaption B: The woman closest to the camera is moving at the fastest speed.", "gt-answer": "Caption B: The woman closest to the camera is moving at the fastest speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman closest to the camera is moving at the fastest speed.\nOption 2: The woman closest to the camera is moving at the slowest speed.", "gt-answer": "Option 1: The woman closest to the camera is moving at the fastest speed.", "video-llm-prediction": "Option 1: The woman closest to the camera is moving at the fastest speed.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman athletes are running from right to left.\nOption 2: The woman athletes are running from left to right.", "gt-answer": "Option 2: The woman athletes are running from left to right.", "video-llm-prediction": "Option 2: The woman athletes are running from left to right.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman athletes are running from left to right.\nSentence B: The woman athletes are running from right to left.", "gt-answer": "Sentence A: The woman athletes are running from left to right.", "video-llm-prediction": "Sentence A: The woman athletes are running from left to right.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman athletes are running from top to bottom.\nCaption B: The woman athletes are running from left to right.", "gt-answer": "Caption B: The woman athletes are running from left to right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1098153561": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at a regular pace.\nOption 2: The video is playing in fast forward.", "gt-answer": "Option 2: The video is playing in fast forward.", "video-llm-prediction": "Option 1: The video is playing at a regular pace.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing in fast forward.\nCaption B: The speed of the video is normal speed.", "gt-answer": "Caption A: The video is playing in fast forward.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is in slow motion.\nSentence B: The video is playing in fast forward.", "gt-answer": "Sentence B: The video is playing in fast forward.", "video-llm-prediction": "Sentence A: The video is in slow motion.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The leaves are changing color from green to yellow.\nCaption B: The leaves are changing color from yellow to green.", "gt-answer": "Caption A: The leaves are changing color from green to yellow.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The leaves are changing color from yellow to green.\nSentence B: The leaves are changing color from green to yellow.", "gt-answer": "Sentence B: The leaves are changing color from green to yellow.", "video-llm-prediction": "Sentence A: The leaves are changing color from yellow to green.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The leaves are changing color from yellow to green.\nOption 2: The leaves are changing color from green to yellow.", "gt-answer": "Option 2: The leaves are changing color from green to yellow.", "video-llm-prediction": "Option 1: The leaves are changing color from yellow to green.", "match_success": true, "rating": 0 } ] }, "1084153195": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The dolphins are diving.\nCaption B: The dolphins are swimming.", "gt-answer": "Caption B: The dolphins are swimming.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The dolphins are swimming.\nOption 2: The dolphins are sleeping.", "gt-answer": "Option 1: The dolphins are swimming.", "video-llm-prediction": "Option 1: The dolphins are swimming.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dolphins are jumping.\nSentence B: The dolphins are swimming.", "gt-answer": "Sentence B: The dolphins are swimming.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The dolphins are hovering in one place.\nCaption B: The dolphins are swimming towards the shore.", "gt-answer": "Caption B: The dolphins are swimming towards the shore.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dolphins are swimming away from the shore.\nSentence B: The dolphins are swimming towards the shore.", "gt-answer": "Sentence B: The dolphins are swimming towards the shore.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The dolphins are swimming towards the shore.\nOption 2: The dolphins are swimming parallel to the shore.", "gt-answer": "Option 1: The dolphins are swimming towards the shore.", "video-llm-prediction": "Option 2: The dolphins are swimming parallel to the shore.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Which caption matches the video better?\nCaption A: The rate of movement in the video is normal speed.\nCaption B: The rate of movement in the video is fast speed.", "gt-answer": "Caption A: The rate of movement in the video is normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The rate of movement in the video is no speed.\nSentence B: The rate of movement in the video is normal speed.", "gt-answer": "Sentence B: The rate of movement in the video is normal speed.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The rate of movement in the video is normal speed.\nOption 2: The rate of movement in the video is slow speed.", "gt-answer": "Option 1: The rate of movement in the video is normal speed.", "video-llm-prediction": "Option 2: The rate of movement in the video is slow speed.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The dolphins swim in circles.\nCaption B: The dolphins swim towards the shore, then get fed with fish.", "gt-answer": "Caption B: The dolphins swim towards the shore, then get fed with fish.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dolphins swim towards the shore, then get fed with fish.\nSentence B: The dolphins get fed with fish, then swim towards the shore.", "gt-answer": "Sentence A: The dolphins swim towards the shore, then get fed with fish.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The dolphins swim towards the shore, then get fed with fish.\nOption 2: Getting fed with fish is the first event that happens to the dolphins.", "gt-answer": "Option 1: The dolphins swim towards the shore, then get fed with fish.", "video-llm-prediction": "Option 2: Getting fed with fish is the first event that happens to the dolphins.", "match_success": true, "rating": 0 } ] }, "1054717541": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is kneading dough.\nSentence B: The person is cutting dough.", "gt-answer": "Sentence A: A person is kneading dough.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is grilling dough.\nOption 2: A person is kneading dough.", "gt-answer": "Option 2: A person is kneading dough.", "video-llm-prediction": "Option 2: A person is kneading dough.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The person is throwing dough.\nCaption B: A person is kneading dough.", "gt-answer": "Caption B: A person is kneading dough.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at normal speed.\nSentence B: The video is playing in slow motion.", "gt-answer": "Sentence B: The video is playing in slow motion.", "video-llm-prediction": "Sentence B: The video is playing in slow motion.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing in slow motion.\nCaption B: The video is playing with a time-lapse effect.", "gt-answer": "Caption A: The video is playing in slow motion.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing in slow motion.\nOption 2: The tempo of the video playback is fast.", "gt-answer": "Option 1: The video is playing in slow motion.", "video-llm-prediction": "Option 1: The video is playing in slow motion.", "match_success": true, "rating": 1 } ] }, "1081092839": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The sun is descending.\nCaption B: The sun is ascending.", "gt-answer": "Caption A: The sun is descending.", "video-llm-prediction": "Caption B: The sun is ascending.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun is moving upwards.\nSentence B: The sun is moving downwards.", "gt-answer": "Sentence B: The sun is moving downwards.", "video-llm-prediction": "Sentence A: The sun is moving upwards.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun is descending.\nOption 2: The sun is rising.", "gt-answer": "Option 1: The sun is descending.", "video-llm-prediction": "Option 2: The sun is rising.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is in slow motion.\nOption 2: The video is in time-lapse.", "gt-answer": "Option 2: The video is in time-lapse.", "video-llm-prediction": "Option 2: The video is in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is in time-lapse.\nSentence B: The speed of the video is normal.", "gt-answer": "Sentence A: The video is in time-lapse.", "video-llm-prediction": "Sentence A: The video is in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is in time-lapse.\nCaption B: The video has a fast pace.", "gt-answer": "Caption A: The video is in time-lapse.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1059462749": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The person is reading a book.\nCaption B: The person is climbing down a ladder.", "gt-answer": "Caption B: The person is climbing down a ladder.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is cooking.\nOption 2: The person is climbing down a ladder.", "gt-answer": "Option 2: The person is climbing down a ladder.", "video-llm-prediction": "Option 2: The person is climbing down a ladder.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is riding a bike.\nSentence B: The person is climbing down a ladder.", "gt-answer": "Sentence B: The person is climbing down a ladder.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is moving downwards.\nSentence B: The person is moving rightwards.", "gt-answer": "Sentence A: The person is moving downwards.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is moving downwards.\nOption 2: The person is moving upwards.", "gt-answer": "Option 1: The person is moving downwards.", "video-llm-prediction": "Option 2: The person is moving upwards.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person is moving downwards.\nCaption B: The person is moving leftwards.", "gt-answer": "Caption A: The person is moving downwards.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing at normal speed.\nSentence B: The video is playing in time-lapse.", "gt-answer": "Sentence A: The video is playing at normal speed.", "video-llm-prediction": "Sentence B: The video is playing in time-lapse.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at normal speed.\nOption 2: The video is playing slowly.", "gt-answer": "Option 1: The video is playing at normal speed.", "video-llm-prediction": "Option 1: The video is playing at normal speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing quickly.\nCaption B: The video is playing at normal speed.", "gt-answer": "Caption B: The video is playing at normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1077590324": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A woman is cooking.\nOption 2: The woman is doing laundry.", "gt-answer": "Option 2: The woman is doing laundry.", "video-llm-prediction": "Option 2: The woman is doing laundry.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is doing laundry.\nSentence B: The woman is singing.", "gt-answer": "Sentence A: The woman is doing laundry.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is doing laundry.\nCaption B: The woman is painting.", "gt-answer": "Caption A: The woman is doing laundry.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the entire video is slow motion.\nSentence B: The entire video is in normal speed.", "gt-answer": "Sentence B: The entire video is in normal speed.", "video-llm-prediction": "Sentence A: The speed of the entire video is slow motion.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The entire video is in normal speed.\nOption 2: The video is playing in high speed.", "gt-answer": "Option 1: The entire video is in normal speed.", "video-llm-prediction": "Option 1: The entire video is in normal speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The velocity of the video playback is low speed.\nCaption B: The entire video is in normal speed.", "gt-answer": "Caption B: The entire video is in normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The woman is putting clothes into the washing machine and then standing up to operate it.\nCaption B: The woman is sitting down to operate the washing machine and then putting clothes into it.", "gt-answer": "Caption A: The woman is putting clothes into the washing machine and then standing up to operate it.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is putting clothes into the washing machine and then standing up to operate it.\nSentence B: The woman is operating the washing machine and then putting clothes into it.", "gt-answer": "Sentence A: The woman is putting clothes into the washing machine and then standing up to operate it.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is putting clothes into the washing machine and then standing up to operate it.\nOption 2: The woman is turning off the washing machine and then getting dressed.", "gt-answer": "Option 1: The woman is putting clothes into the washing machine and then standing up to operate it.", "video-llm-prediction": "Option 1: The woman is putting clothes into the washing machine and then standing up to operate it.", "match_success": true, "rating": 1 } ] }, "1040541401": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The children are painting pictures.\nSentence B: The children are doing chemical experiments.", "gt-answer": "Sentence B: The children are doing chemical experiments.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The children are reading books.\nOption 2: The children are doing chemical experiments.", "gt-answer": "Option 2: The children are doing chemical experiments.", "video-llm-prediction": "Option 2: The children are doing chemical experiments.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The children are doing chemical experiments.\nCaption B: The children are playing soccer.", "gt-answer": "Caption A: The children are doing chemical experiments.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is in time-lapse.\nSentence B: The video is playing at normal speed.", "gt-answer": "Sentence B: The video is playing at normal speed.", "video-llm-prediction": "Sentence A: The video is in time-lapse.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at normal speed.\nOption 2: The video is playing in super slow motion.", "gt-answer": "Option 1: The video is playing at normal speed.", "video-llm-prediction": "Option 1: The video is playing at normal speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing at normal speed.\nCaption B: The video is playing very slow.", "gt-answer": "Caption A: The video is playing at normal speed.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1059072773": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The ice cream is melting.\nCaption B: The ice cream is freezing.", "gt-answer": "Caption A: The ice cream is melting.", "video-llm-prediction": "Caption A: The ice cream is melting.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ice cream is evaporating.\nOption 2: The ice cream is melting.", "gt-answer": "Option 2: The ice cream is melting.", "video-llm-prediction": "Option 2: The ice cream is melting.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream is melting.\nSentence B: The ice cream is solidifying.", "gt-answer": "Sentence A: The ice cream is melting.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 } ] }, "1064645467": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is cooking.\nOption 2: The man is doing exercise.", "gt-answer": "Option 2: The man is doing exercise.", "video-llm-prediction": "Option 2: The man is doing exercise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A video showing the man reading a book.\nSentence B: The man is doing exercise.", "gt-answer": "Sentence B: The man is doing exercise.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is swimming.\nCaption B: The man is doing exercise.", "gt-answer": "Caption B: The man is doing exercise.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at normal speed.\nOption 2: The video is playing in slow motion.", "gt-answer": "Option 1: The video is playing at normal speed.", "video-llm-prediction": "Option 2: The video is playing in slow motion.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing at normal speed.\nCaption B: The video is playing at a fast speed.", "gt-answer": "Caption A: The video is playing at normal speed.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the video is time-lapse.\nSentence B: The video is playing at normal speed.", "gt-answer": "Sentence B: The video is playing at normal speed.", "video-llm-prediction": "Sentence A: The video is playing at normal speed.", "match_success": false, "chatgpt-response": "Incorrect", "rating": 0 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man takes off his jacket and then jumps up to grab the bar.\nOption 2: The man jumps up to grab the bar before taking off his jacket.", "gt-answer": "Option 1: The man takes off his jacket and then jumps up to grab the bar.", "video-llm-prediction": "Option 2: The man jumps up to grab the bar before taking off his jacket.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The man takes off his jacket and then jumps up to grab the bar.\nCaption B: The man takes off his jacket after jumping down from the bar.", "gt-answer": "Caption A: The man takes off his jacket and then jumps up to grab the bar.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man takes off his jacket and then jumps up to grab the bar.\nSentence B: The man jumps down from the bar and then puts on his jacket.", "gt-answer": "Sentence A: The man takes off his jacket and then jumps up to grab the bar.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1088279109": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The elevator is rising.\nSentence B: The elevator is going down.", "gt-answer": "Sentence A: The elevator is rising.", "video-llm-prediction": "Sentence A: The elevator is rising.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The elevator is staying still.\nCaption B: The elevator is rising.", "gt-answer": "Caption B: The elevator is rising.", "video-llm-prediction": "Caption B: The elevator is rising.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The elevator is rising.\nOption 2: The elevator is not moving.", "gt-answer": "Option 1: The elevator is rising.", "video-llm-prediction": "Option 2: The elevator is not moving.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Which caption matches the video better?\nCaption A: The video is playing at normal speed.\nCaption B: The video is in slow motion.", "gt-answer": "Caption A: The video is playing at normal speed.", "video-llm-prediction": "Caption B: The video is in slow motion.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is being played in fast forward mode.\nOption 2: The video is playing at normal speed.", "gt-answer": "Option 2: The video is playing at normal speed.", "video-llm-prediction": "Option 2: The video is playing at normal speed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is on pause.\nSentence B: The video is playing at normal speed.", "gt-answer": "Sentence B: The video is playing at normal speed.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1093573255": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is running in time-lapse.\nOption 2: The video is running at normal speed.", "gt-answer": "Option 1: The video is running in time-lapse.", "video-llm-prediction": "Option 1: The video is running in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is in slow motion.\nSentence B: The video is running in time-lapse.", "gt-answer": "Sentence B: The video is running in time-lapse.", "video-llm-prediction": "Sentence B: The video is running in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is running steadily.\nCaption B: The video is running in time-lapse.", "gt-answer": "Caption B: The video is running in time-lapse.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The plant is reviving.\nOption 2: The plant is wilting.", "gt-answer": "Option 1: The plant is reviving.", "video-llm-prediction": "Option 1: The plant is reviving.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The plant is decaying.\nSentence B: The plant is reviving.", "gt-answer": "Sentence B: The plant is reviving.", "video-llm-prediction": "Sentence B: The plant is reviving.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The plant is reviving.\nCaption B: The plant is wilting.", "gt-answer": "Caption A: The plant is reviving.", "video-llm-prediction": "Caption A: The plant is reviving.", "match_success": true, "rating": 1 } ] }, "1105233293": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The people in the video are swimming.\nSentence B: The people in the video are playing basketball.", "gt-answer": "Sentence B: The people in the video are playing basketball.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The people in the video are playing basketball.\nCaption B: The people in the video are dancing.", "gt-answer": "Caption A: The people in the video are playing basketball.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people in the video are sleeping.\nOption 2: The people in the video are playing basketball.", "gt-answer": "Option 2: The people in the video are playing basketball.", "video-llm-prediction": "Option 2: The people in the video are playing basketball.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at accelerated speed.\nOption 2: The video is playing at normal speed.", "gt-answer": "Option 2: The video is playing at normal speed.", "video-llm-prediction": "Option 2: The video is playing at normal speed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing in reverse.\nSentence B: The video is playing at normal speed.", "gt-answer": "Sentence B: The video is playing at normal speed.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing at normal speed.\nCaption B: The video is in slow-motion.", "gt-answer": "Caption A: The video is playing at normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The players are passing the ball to each other and then shooting the basketball.\nSentence B: The players are shooting the basketball and then blocking the opponent.", "gt-answer": "Sentence A: The players are passing the ball to each other and then shooting the basketball.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The players are passing the ball to each other and then shooting the basketball.\nCaption B: The players are shooting the basketball and then dribbling the ball.", "gt-answer": "Caption A: The players are passing the ball to each other and then shooting the basketball.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The players are passing the ball to each other and then shooting the basketball.\nOption 2: The players are passing the ball to each other and then blocking the opponent.", "gt-answer": "Option 1: The players are passing the ball to each other and then shooting the basketball.", "video-llm-prediction": "Option 1: The players are passing the ball to each other and then shooting the basketball.", "match_success": true, "rating": 1 } ] }, "1077146132": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A woman is tossing and turning in the bed.\nSentence B: The woman is waking up in the video.", "gt-answer": "Sentence B: The woman is waking up in the video.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The woman is falling asleep.\nCaption B: The woman is waking up in the video.", "gt-answer": "Caption B: The woman is waking up in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is waking up in the video.\nOption 2: The woman is lying down on the bed.", "gt-answer": "Option 1: The woman is waking up in the video.", "video-llm-prediction": "Option 1: The woman is waking up in the video.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The first event in the sequence is getting out of bed.\nCaption B: The first event in the sequence is opening the curtains.", "gt-answer": "Caption A: The first event in the sequence is getting out of bed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Closing the curtains occurs before getting into bed.\nOption 2: The first event in the sequence is getting out of bed.", "gt-answer": "Option 2: The first event in the sequence is getting out of bed.", "video-llm-prediction": "Option 1: Closing the curtains occurs before getting into bed.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman closes the curtais and then gets into bed.\nSentence B: The first event in the sequence is getting out of bed.", "gt-answer": "Sentence B: The first event in the sequence is getting out of bed.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is turning darker.\nOption 2: The video is turning brighter.", "gt-answer": "Option 2: The video is turning brighter.", "video-llm-prediction": "Option 2: The video is turning brighter.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is staying the same brightness.\nSentence B: The video is turning brighter.", "gt-answer": "Sentence B: The video is turning brighter.", "video-llm-prediction": "Sentence B: The video is turning brighter.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is decreasing in brightness.\nCaption B: The video is turning brighter.", "gt-answer": "Caption B: The video is turning brighter.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1086688682": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The traffic lights are changing from red to yellow.\nSentence B: The traffic lights are changing from red to green.", "gt-answer": "Sentence B: The traffic lights are changing from red to green.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The traffic lights are changing from yellow to red.\nCaption B: The traffic lights are changing from red to green.", "gt-answer": "Caption B: The traffic lights are changing from red to green.", "video-llm-prediction": "Caption B: The traffic lights are changing from red to green.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The traffic lights are changing from green to red.\nOption 2: The traffic lights are changing from red to green.", "gt-answer": "Option 2: The traffic lights are changing from red to green.", "video-llm-prediction": "Option 1: The traffic lights are changing from green to red.", "match_success": true, "rating": 0 } ] }, "1096612823": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The car is sliding on ice.\nCaption B: The car is driving on the road.", "gt-answer": "Caption B: The car is driving on the road.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The car is dancing on the rooftop.\nSentence B: The car is driving on the road.", "gt-answer": "Sentence B: The car is driving on the road.", "video-llm-prediction": "Sentence B: The car is driving on the road.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The car is driving on the road.\nOption 2: The car is buried in the sand.", "gt-answer": "Option 1: The car is driving on the road.", "video-llm-prediction": "Option 1: The car is driving on the road.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is zooming in.\nOption 2: The video is zooming out.", "gt-answer": "Option 1: The video is zooming in.", "video-llm-prediction": "Option 2: The video is zooming out.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is zooming in.\nCaption B: The video is rotating.", "gt-answer": "Caption A: The video is zooming in.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is zooming in.\nSentence B: The video is panning left.", "gt-answer": "Sentence A: The video is zooming in.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1075484900": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The child is turning away from the man.\nSentence B: The child is turning towards the man.", "gt-answer": "Sentence A: The child is turning away from the man.", "video-llm-prediction": "Sentence B: The child is turning towards the man.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The child is turning towards the man.\nOption 2: The child is turning away from the man.", "gt-answer": "Option 2: The child is turning away from the man.", "video-llm-prediction": "Option 1: The child is turning towards the man.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The child is moving forward in relation to the man.\nCaption B: The child is turning away from the man.", "gt-answer": "Caption B: The child is turning away from the man.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1090578917": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is painting a picture.\nSentence B: The man is playing soccer.", "gt-answer": "Sentence B: The man is playing soccer.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is reading a book.\nOption 2: The man is playing soccer.", "gt-answer": "Option 2: The man is playing soccer.", "video-llm-prediction": "Option 2: The man is playing soccer.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is playing soccer.\nCaption B: The man is cooking dinner.", "gt-answer": "Caption A: The man is playing soccer.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man stands up from the ground, then leaps to his right.\nSentence B: The man is leaping to his right and then standing up.", "gt-answer": "Sentence B: The man is leaping to his right and then standing up.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person is standing up from the ground and then leaping to this right.\nOption 2: The man is leaping to his right and then standing up.", "gt-answer": "Option 2: The man is leaping to his right and then standing up.", "video-llm-prediction": "Option 1: A person is standing up from the ground and then leaping to this right.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The man is leaping to his right after standing up.\nCaption B: The man is leaping to his right and then standing up.", "gt-answer": "Caption B: The man is leaping to his right and then standing up.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The man is leaping to his left.\nCaption B: The man is leaping to his right.", "gt-answer": "Caption B: The man is leaping to his right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is leaping to his right.\nSentence B: The man is leaping backward.", "gt-answer": "Sentence A: The man is leaping to his right.", "video-llm-prediction": "Sentence A: The man is leaping to his right.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is leaping to his right.\nOption 2: The man is leaping forward.", "gt-answer": "Option 1: The man is leaping to his right.", "video-llm-prediction": "Option 2: The man is leaping forward.", "match_success": true, "rating": 0 } ] }, "1075338140": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ball is rolling from right to left.\nSentence B: The ball is rolling from left to right.", "gt-answer": "Sentence B: The ball is rolling from left to right.", "video-llm-prediction": "Sentence B: The ball is rolling from left to right.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The ball is rolling from left to right.\nCaption B: The ball is rolling from right to left.", "gt-answer": "Caption A: The ball is rolling from left to right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ball is rolling from right to left.\nOption 2: The ball is rolling from left to right.", "gt-answer": "Option 2: The ball is rolling from left to right.", "video-llm-prediction": "Option 2: The ball is rolling from left to right.", "match_success": true, "rating": 1 } ] }, "1067268403": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The wind turbines are stationary.\nCaption B: The wind turbines are rotating clockwise.", "gt-answer": "Caption B: The wind turbines are rotating clockwise.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The wind turbines are rotating counterclockwise.\nSentence B: The wind turbines are rotating clockwise.", "gt-answer": "Sentence B: The wind turbines are rotating clockwise.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The wind turbines are rotating counterclockwise.\nOption 2: The wind turbines are rotating clockwise.", "gt-answer": "Option 2: The wind turbines are rotating clockwise.", "video-llm-prediction": "Option 1: The wind turbines are rotating counterclockwise.", "match_success": true, "rating": 0 } ] }, "1072594556": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The car in the center of the screen is moving faster than other cars.\nOption 2: The car in the center of the screen is moving at the same speed as other cars.", "gt-answer": "Option 1: The car in the center of the screen is moving faster than other cars.", "video-llm-prediction": "Option 1: The car in the center of the screen is moving faster than other cars.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The car in the center of the screen is moving slower than other cars.\nSentence B: The car in the center of the screen is moving faster than other cars.", "gt-answer": "Sentence B: The car in the center of the screen is moving faster than other cars.", "video-llm-prediction": "Sentence B: The car in the center of the screen is moving faster than other cars.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the car in the center of the screen is unknown.\nCaption B: The car in the center of the screen is moving faster than other cars.", "gt-answer": "Caption B: The car in the center of the screen is moving faster than other cars.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1096007487": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3d cloud is moving upward from the camera's point of view.\nSentence B: The 3d cloud is moving leftward from the camera's point of view.", "gt-answer": "Sentence B: The 3d cloud is moving leftward from the camera's point of view.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The 3d cloud is moving downward from the camera's point of view.\nCaption B: The 3d cloud is moving leftward from the camera's point of view.", "gt-answer": "Caption B: The 3d cloud is moving leftward from the camera's point of view.", "video-llm-prediction": "Caption B: The 3d cloud is moving leftward from the camera's point of view.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3d cloud is moving rightward from the camera's point of view.\nOption 2: The 3d cloud is moving leftward from the camera's point of view.", "gt-answer": "Option 2: The 3d cloud is moving leftward from the camera's point of view.", "video-llm-prediction": "Option 1: The 3d cloud is moving rightward from the camera's point of view.", "match_success": true, "rating": 0 } ] }, "1095939659": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The light is growing clockwise.\nCaption B: The light is growing downwards.", "gt-answer": "Caption A: The light is growing clockwise.", "video-llm-prediction": "Caption A: The light is growing clockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The light is growing counterclockwise.\nSentence B: The light is growing clockwise.", "gt-answer": "Sentence B: The light is growing clockwise.", "video-llm-prediction": "Sentence A: The light is growing counterclockwise.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The light is growing clockwise.\nOption 2: The light is moving straight forward.", "gt-answer": "Option 1: The light is growing clockwise.", "video-llm-prediction": "Option 1: The light is growing clockwise.", "match_success": true, "rating": 1 } ] }, "1059632327": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The tennis ball is bouncing up and down.\nOption 2: The tennis ball is spinning clockwise and anticlockwise.", "gt-answer": "Option 1: The tennis ball is bouncing up and down.", "video-llm-prediction": "Option 1: The tennis ball is bouncing up and down.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The tennis ball is rolling forward and backward.\nSentence B: The tennis ball is bouncing up and down.", "gt-answer": "Sentence B: The tennis ball is bouncing up and down.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The tennis ball is bouncing left to right.\nCaption B: The tennis ball is bouncing up and down.", "gt-answer": "Caption B: The tennis ball is bouncing up and down.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1098785169": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The galaxy is spinning counterclockwise.\nCaption B: The galaxy is rotating clockwise.", "gt-answer": "Caption B: The galaxy is rotating clockwise.", "video-llm-prediction": "Caption B: The galaxy is rotating clockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The galaxy's spin is counterclockwise.\nSentence B: The galaxy is rotating clockwise.", "gt-answer": "Sentence B: The galaxy is rotating clockwise.", "video-llm-prediction": "Sentence A: The galaxy's spin is counterclockwise.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The rotation of the galaxy is counterclockwise.\nOption 2: The galaxy is rotating clockwise.", "gt-answer": "Option 2: The galaxy is rotating clockwise.", "video-llm-prediction": "Option 1: The galaxy is rotating counterclockwise.", "match_success": false, "chatgpt-response": "Incorrect", "rating": 0 } ] }, "1099984801": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The clouds are moving away from the camera.\nSentence B: The clouds are moving towards the camera.", "gt-answer": "Sentence B: The clouds are moving towards the camera.", "video-llm-prediction": "Sentence B: The clouds are moving towards the camera.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The clouds are moving towards the camera.\nOption 2: The clouds are staying still.", "gt-answer": "Option 1: The clouds are moving towards the camera.", "video-llm-prediction": "Option 2: The clouds are staying still.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The clouds are moving away from the camera.\nCaption B: The clouds are moving towards the camera.", "gt-answer": "Caption B: The clouds are moving towards the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is set to time-lapse speed.\nOption 2: The video is in slow motion.", "gt-answer": "Option 1: The video is set to time-lapse speed.", "video-llm-prediction": "Option 1: The video is set to time-lapse speed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is set to time-lapse speed.\nSentence B: The video is set to real-time speed.", "gt-answer": "Sentence A: The video is set to time-lapse speed.", "video-llm-prediction": "Sentence B: The video is set to real-time speed.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is set to time-lapse speed.\nCaption B: The video is dilated in time.", "gt-answer": "Caption A: The video is set to time-lapse speed.", "video-llm-prediction": "Caption A: The video is set to time-lapse speed.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The brightness of the video is staying the same.\nOption 2: The entire video is getting darker.", "gt-answer": "Option 2: The entire video is getting darker.", "video-llm-prediction": "Option 2: The entire video is getting darker.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The entire video is getting darker.\nCaption B: The video is getting brighter.", "gt-answer": "Caption A: The entire video is getting darker.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The entire video is getting darker.\nSentence B: The entire video is getting brighter.", "gt-answer": "Sentence A: The entire video is getting darker.", "video-llm-prediction": "Sentence A: The entire video is getting darker.", "match_success": true, "rating": 1 } ] }, "1082419672": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The movement in the video is flying upwards relative to the ship.\nOption 2: The movement in the video is flying backwards relative to the ship.", "gt-answer": "Option 2: The movement in the video is flying backwards relative to the ship.", "video-llm-prediction": "Option 1: The movement in the video is flying upwards relative to the ship.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The movement in the video is flying backwards relative to the ship.\nSentence B: The movement in the video is flying forwards relative to the ship.", "gt-answer": "Sentence A: The movement in the video is flying backwards relative to the ship.", "video-llm-prediction": "Sentence A: The movement in the video is flying backwards relative to the ship.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The movement in the video is flying backwards relative to the ship.\nCaption B: The movement in the video is flying forwards relative to the ship.", "gt-answer": "Caption A: The movement in the video is flying backwards relative to the ship.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1058985719": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The airplane is moving from right to left.\nCaption B: The airplane is flying from bottom to top.", "gt-answer": "Caption B: The airplane is flying from bottom to top.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The airplane is flying from bottom to top.\nOption 2: The airplane is flying from top to bottom.", "gt-answer": "Option 1: The airplane is flying from bottom to top.", "video-llm-prediction": "Option 2: The airplane is flying from top to bottom.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The airplane is flying from bottom to top.\nSentence B: The airplane is moving from left to right.", "gt-answer": "Sentence A: The airplane is flying from bottom to top.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1055413730": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The planet Earth is spinning to the left.\nOption 2: The planet Earth is spinning to the right.", "gt-answer": "Option 2: The planet Earth is spinning to the right.", "video-llm-prediction": "Option 2: The planet Earth is spinning to the right.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The planet Earth is spinning to the right.\nCaption B: The Earth is rotating upward.", "gt-answer": "Caption A: The planet Earth is spinning to the right.", "video-llm-prediction": "Caption A: The planet Earth is spinning to the right.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The planet Earth is spinning to the left.\nSentence B: The planet Earth is spinning to the right.", "gt-answer": "Sentence B: The planet Earth is spinning to the right.", "video-llm-prediction": "Sentence A: The planet Earth is spinning to the left.", "match_success": true, "rating": 0 } ] }, "1081684532": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The asteroids in the video are flying towards the camera.\nSentence B: The asteroids are flying away from the camera.", "gt-answer": "Sentence A: The asteroids in the video are flying towards the camera.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The asteroids in the video are flying towards the camera.\nOption 2: The asteroids are flying to the left.", "gt-answer": "Option 1: The asteroids in the video are flying towards the camera.", "video-llm-prediction": "Option 1: The asteroids in the video are flying towards the camera.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The asteroids are flying to the right.\nCaption B: The asteroids in the video are flying towards the camera.", "gt-answer": "Caption B: The asteroids in the video are flying towards the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "23391142": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The people in the video are dancing.\nCaption B: The people in the video are playing badminton.", "gt-answer": "Caption B: The people in the video are playing badminton.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The people in the video are playing badminton.\nSentence B: The people are reading books.", "gt-answer": "Sentence A: The people in the video are playing badminton.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people in the video are playing badminton.\nOption 2: The people in the video are playing soccer.", "gt-answer": "Option 1: The people in the video are playing badminton.", "video-llm-prediction": "Option 1: The people in the video are playing badminton.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is panning upwards.\nOption 2: The video is panning to the right.", "gt-answer": "Option 2: The video is panning to the right.", "video-llm-prediction": "Option 2: The video is panning to the right.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is zooming in.\nCaption B: The video is panning to the right.", "gt-answer": "Caption B: The video is panning to the right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is panning to the right.\nSentence B: The video is panning to the left.", "gt-answer": "Sentence A: The video is panning to the right.", "video-llm-prediction": "Sentence A: The video is panning to the right.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing at normal speed.\nOption 2: The video is playing in slow motion.", "gt-answer": "Option 2: The video is playing in slow motion.", "video-llm-prediction": "Option 1: The video is playing at normal speed.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing in slow motion.\nCaption B: The video is playing in time-lapse.", "gt-answer": "Caption A: The video is playing in slow motion.", "video-llm-prediction": "Caption B: The video is playing in time-lapse.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing in slow motion.\nSentence B: The video is playing quickly.", "gt-answer": "Sentence A: The video is playing in slow motion.", "video-llm-prediction": "Sentence A: The video is playing in slow motion.", "match_success": true, "rating": 1 } ] }, "1078368947": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is washing her face in the bathroom.\nOption 2: A woman is reading a book in the bathroom.", "gt-answer": "Option 2: A woman is reading a book in the bathroom.", "video-llm-prediction": "Option 2: A woman is reading a book in the bathroom.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A woman is reading a book in the bathroom.\nSentence B: The woman is taking a shower in the bathroom.", "gt-answer": "Sentence A: A woman is reading a book in the bathroom.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is washing her hair in the bathroom.\nCaption B: A woman is reading a book in the bathroom.", "gt-answer": "Caption B: A woman is reading a book in the bathroom.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1099738787": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The concrete wall is falling apart.\nCaption B: The concrete wall is assembling together.", "gt-answer": "Caption A: The concrete wall is falling apart.", "video-llm-prediction": "Caption B: The concrete wall is assembling together.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The concrete wall is falling apart.\nOption 2: The concrete wall is growing taller.", "gt-answer": "Option 1: The concrete wall is falling apart.", "video-llm-prediction": "Option 1: The concrete wall is falling apart.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The concrete wall is assembling together.\nSentence B: The concrete wall is falling apart.", "gt-answer": "Sentence B: The concrete wall is falling apart.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1094219575": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is played in normal speed.\nSentence B: The video is played in time-lapse mode.", "gt-answer": "Sentence B: The video is played in time-lapse mode.", "video-llm-prediction": "Sentence B: The video is played in time-lapse mode.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is played in time-lapse mode.\nOption 2: The video is played in slow motion.", "gt-answer": "Option 1: The video is played in time-lapse mode.", "video-llm-prediction": "Option 1: The video is played in time-lapse mode.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is played in fast forwarding mode.\nCaption B: The video is played in time-lapse mode.", "gt-answer": "Caption B: The video is played in time-lapse mode.", "video-llm-prediction": "Caption B: The video is played in time-lapse mode.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The flowers are blooming.\nCaption B: The flowers are wilting.", "gt-answer": "Caption B: The flowers are wilting.", "video-llm-prediction": "Caption B: The flowers are wilting.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The flowers are blooming.\nOption 2: The flowers are wilting.", "gt-answer": "Option 2: The flowers are wilting.", "video-llm-prediction": "Option 1: The flowers are blooming.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The flowers are wilting.\nSentence B: The flowers are blooming.", "gt-answer": "Sentence A: The flowers are wilting.", "video-llm-prediction": "Sentence B: The flowers are blooming.", "match_success": true, "rating": 0 } ] }, "1053758117": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The camera is standing still before a 3D digital brain.\nCaption B: The camera is zooming into a 3D digital brain.", "gt-answer": "Caption B: The camera is zooming into a 3D digital brain.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is zooming out from a 3D digital brain.\nOption 2: The camera is zooming into a 3D digital brain.", "gt-answer": "Option 2: The camera is zooming into a 3D digital brain.", "video-llm-prediction": "Option 2: The camera is zooming into a 3D digital brain.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming into a 3D digital brain.\nSentence B: The camera is moving downwards.", "gt-answer": "Sentence A: The camera is zooming into a 3D digital brain.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1069717165": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman shakes her head, followed by nodding.\nOption 2: The woman nods her head repeatedly.", "gt-answer": "Option 1: The woman shakes her head, followed by nodding.", "video-llm-prediction": "Option 2: The woman nods her head repeatedly.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The woman shakes her head, followed by nodding.\nCaption B: After shaking her head, the woman feels sad.", "gt-answer": "Caption A: The woman shakes her head, followed by nodding.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman shakes her head, followed by nodding.\nSentence B: The woman shakes her head after nodding her head.", "gt-answer": "Sentence A: The woman shakes her head, followed by nodding.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1041584314": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The man's expression changes from serious to smiling.\nCaption B: The man doesn't change his expression.", "gt-answer": "Caption A: The man's expression changes from serious to smiling.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man's expression changes from serious to smiling.\nSentence B: The man starts to smile before showing a serious expression.", "gt-answer": "Sentence A: The man's expression changes from serious to smiling.", "video-llm-prediction": "Sentence A: The man's expression changes from serious to smiling.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man's expression changes from serious to smiling.\nOption 2: The man never smiles.", "gt-answer": "Option 1: The man's expression changes from serious to smiling.", "video-llm-prediction": "Option 1: The man's expression changes from serious to smiling.", "match_success": true, "rating": 1 } ] }, "1067427023": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The video is playing at normal speed.\nCaption B: The video is playing in time-lapse.", "gt-answer": "Caption B: The video is playing in time-lapse.", "video-llm-prediction": "Caption B: The video is playing in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing in slow motion.\nSentence B: The video is playing in time-lapse.", "gt-answer": "Sentence B: The video is playing in time-lapse.", "video-llm-prediction": "Sentence A: The video is playing in slow motion.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing in time-lapse.\nOption 2: The speed of the video is unknown.", "gt-answer": "Option 1: The video is playing in time-lapse.", "video-llm-prediction": "Option 1: The video is playing in time-lapse.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The snow particles are melting.\nSentence B: The snow particles are solidifying.", "gt-answer": "Sentence A: The snow particles are melting.", "video-llm-prediction": "Sentence A: The snow particles are melting.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The snow particles are freezing.\nOption 2: The snow particles are melting.", "gt-answer": "Option 2: The snow particles are melting.", "video-llm-prediction": "Option 2: The snow particles are melting.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The snow particles are melting.\nCaption B: The snow particles are remaining the same.", "gt-answer": "Caption A: The snow particles are melting.", "video-llm-prediction": "Caption B: The snow particles are remaining the same.", "match_success": true, "rating": 0 } ] }, "1093948229": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The golden particles are exploding.\nSentence B: The golden particles are disappearing.", "gt-answer": "Sentence A: The golden particles are exploding.", "video-llm-prediction": "Sentence A: The golden particles are exploding.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The golden particles are exploding.\nOption 2: The golden particles are shrinking.", "gt-answer": "Option 1: The golden particles are exploding.", "video-llm-prediction": "Option 1: The golden particles are exploding.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The golden particles are contracting.\nCaption B: The golden particles are exploding.", "gt-answer": "Caption B: The golden particles are exploding.", "video-llm-prediction": "Caption B: The golden particles are exploding.", "match_success": true, "rating": 1 } ] }, "1106668103": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is staying still.\nOption 2: The movement in the video is forward.", "gt-answer": "Option 2: The movement in the video is forward.", "video-llm-prediction": "Option 2: The movement in the video is forward.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The movement in the video is forward.\nCaption B: The movement in the video is backward.", "gt-answer": "Caption A: The movement in the video is forward.", "video-llm-prediction": "Caption A: The movement in the video is forward.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The movement in the video is forward.\nSentence B: The primary motion depicted in the video is turning in circles.", "gt-answer": "Sentence A: The movement in the video is forward.", "video-llm-prediction": "Sentence A: The movement in the video is forward.", "match_success": true, "rating": 1 } ] }, "1049965795": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The light bulb is turning off.\nSentence B: The light bulb is lighting up.", "gt-answer": "Sentence B: The light bulb is lighting up.", "video-llm-prediction": "Sentence B: The light bulb is lighting up.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The light bulb is breaking.\nCaption B: The light bulb is lighting up.", "gt-answer": "Caption B: The light bulb is lighting up.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The light bulb is rapidly changing color.\nOption 2: The light bulb is lighting up.", "gt-answer": "Option 2: The light bulb is lighting up.", "video-llm-prediction": "Option 1: The light bulb is rapidly changing color.", "match_success": true, "rating": 0 } ] }, "1052364490": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The digital bar chart is growing.\nSentence B: The digital bar chart is staying in the same size.", "gt-answer": "Sentence A: The digital bar chart is growing.", "video-llm-prediction": "Sentence A: The digital bar chart is growing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The digital bar chart is growing.\nCaption B: The digital bar chart is shrinking.", "gt-answer": "Caption A: The digital bar chart is growing.", "video-llm-prediction": "Caption B: The digital bar chart is shrinking.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The digital bar chart is decreasing.\nOption 2: The digital bar chart is growing.", "gt-answer": "Option 2: The digital bar chart is growing.", "video-llm-prediction": "Option 1: The digital bar chart is decreasing.", "match_success": true, "rating": 0 } ] }, "1080990179": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The apple is shrinking and drying out.\nCaption B: The apple is ripening.", "gt-answer": "Caption A: The apple is shrinking and drying out.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The apple is shrinking and drying out.\nSentence B: The apple is growing bigger.", "gt-answer": "Sentence A: The apple is shrinking and drying out.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The apple is becoming juicier.\nOption 2: The apple is shrinking and drying out.", "gt-answer": "Option 2: The apple is shrinking and drying out.", "video-llm-prediction": "Option 2: The apple is shrinking and drying out.", "match_success": true, "rating": 1 } ] }, "1057163434": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The chef is removing the bread from the top of the burger.\nCaption B: The chef is putting the bread on top of the burger.", "gt-answer": "Caption B: The chef is putting the bread on top of the burger.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The chef is putting the bread on top of the burger.\nOption 2: The chef is removing the bread from the top of the burger.", "gt-answer": "Option 1: The chef is putting the bread on top of the burger.", "video-llm-prediction": "Option 1: The chef is putting the bread on top of the burger.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The chef is putting the bread on top of the burger.\nSentence B: The chef is removing the bread from the top of the burger.", "gt-answer": "Sentence A: The chef is putting the bread on top of the burger.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1085910917": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is drinking in the video.\nSentence B: The woman is sleeping.", "gt-answer": "Sentence A: The woman is drinking in the video.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is drinking in the video.\nCaption B: A woman is dancing in the video.", "gt-answer": "Caption A: The woman is drinking in the video.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is drinking in the video.\nOption 2: She is cooking.", "gt-answer": "Option 1: The woman is drinking in the video.", "video-llm-prediction": "Option 1: The woman is drinking in the video.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is turning back and then drinking a glass of water.\nSentence B: The person is drinking a glass of water and then turning back.", "gt-answer": "Sentence B: The person is drinking a glass of water and then turning back.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person is turning back and drinking a glass of water at the same time.\nCaption B: The person is drinking a glass of water and then turning back.", "gt-answer": "Caption B: The person is drinking a glass of water and then turning back.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is drinking a glass of water after turning back.\nOption 2: The person is drinking a glass of water and then turning back.", "gt-answer": "Option 2: The person is drinking a glass of water and then turning back.", "video-llm-prediction": "Option 2: The person is drinking a glass of water and then turning back.", "match_success": true, "rating": 1 } ] }, "1058907236": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The squirrel is sleeping.\nSentence B: The squirrel is foraging.", "gt-answer": "Sentence B: The squirrel is foraging.", "video-llm-prediction": "Sentence B: The squirrel is foraging.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The squirrel is swimming in the park.\nOption 2: The squirrel is foraging.", "gt-answer": "Option 2: The squirrel is foraging.", "video-llm-prediction": "Option 2: The squirrel is foraging.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The squirrel is foraging.\nCaption B: The squirrel is dancing in the park.", "gt-answer": "Caption A: The squirrel is foraging.", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The correct order of events is picking up a nut followed by turning back.\nCaption B: The correct order of events is picking up a nut after turning back.", "gt-answer": "Caption A: The correct order of events is picking up a nut followed by turning back.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The correct order of events is turning back to pick up a nut.\nOption 2: The correct order of events is picking up a nut followed by turning back.", "gt-answer": "Option 2: The correct order of events is picking up a nut followed by turning back.", "video-llm-prediction": "Option 1: The correct order of events is turning back to pick up a nut.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The squirrel is turning back followed by picking up a nut.\nSentence B: The correct order of events is picking up a nut followed by turning back.", "gt-answer": "Sentence B: The correct order of events is picking up a nut followed by turning back.", "video-llm-prediction": "Sentence A: The squirrel is turning back followed by picking up a nut.", "match_success": true, "rating": 0 } ] }, "1077575504": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The pile of salt is shrinking.\nOption 2: The pile of salt is growing.", "gt-answer": "Option 2: The pile of salt is growing.", "video-llm-prediction": "Option 1: The pile of salt is shrinking.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The pile of salt is melting.\nSentence B: The pile of salt is growing.", "gt-answer": "Sentence B: The pile of salt is growing.", "video-llm-prediction": "Sentence A: The pile of salt is melting.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The pile of salt is growing.\nCaption B: The pile of salt is disappearing.", "gt-answer": "Caption A: The pile of salt is growing.", "video-llm-prediction": "Caption B: The pile of salt is disappearing.", "match_success": true, "rating": 0 } ] }, "23370985": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice crystal is forming.\nSentence B: The ice crystal is shattering.", "gt-answer": "Sentence A: The ice crystal is forming.", "video-llm-prediction": "Sentence A: The ice crystal is forming.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The ice crystal is melting.\nCaption B: The ice crystal is forming.", "gt-answer": "Caption B: The ice crystal is forming.", "video-llm-prediction": "Caption B: The ice crystal is forming.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ice crystal is reducing in size.\nOption 2: The ice crystal is growing in size.", "gt-answer": "Option 2: The ice crystal is growing in size.", "video-llm-prediction": "Option 1: The ice crystal is reducing in size.", "match_success": true, "rating": 0 } ] }, "1100319395": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The circular pattern is moving counter-clockwise.\nCaption B: The circular pattern is moving clockwise.", "gt-answer": "Caption B: The circular pattern is moving clockwise.", "video-llm-prediction": "Caption B: The circular pattern is moving clockwise.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The circular pattern is moving clockwise.\nOption 2: The circular pattern is spinning counter-clockwise.", "gt-answer": "Option 1: The circular pattern is moving clockwise.", "video-llm-prediction": "Option 1: The circular pattern is moving clockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The circular pattern is vibrating back and forth.\nSentence B: The circular pattern is moving clockwise.", "gt-answer": "Sentence B: The circular pattern is moving clockwise.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1067268406": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: At the same speed as the camera, the car is moving.\nCaption B: The car is moving faster than the camera.", "gt-answer": "Caption B: The car is moving faster than the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The car is moving slower than the camera.\nSentence B: The car is moving faster than the camera.", "gt-answer": "Sentence B: The car is moving faster than the camera.", "video-llm-prediction": "Sentence A: The car is moving slower than the camera.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The car and the camera have the same speed.\nOption 2: The car is moving faster than the camera.", "gt-answer": "Option 2: The car is moving faster than the camera.", "video-llm-prediction": "Option 1: The car and the camera have the same speed.", "match_success": true, "rating": 0 } ] }, "1092682551": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The cars are traveling at the same speed as the camera.\nOption 2: The cars are traveling slower than the camera.", "gt-answer": "Option 2: The cars are traveling slower than the camera.", "video-llm-prediction": "Option 2: The cars are traveling slower than the camera.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The cars are traveling slower than the camera.\nSentence B: The cars are traveling faster than the camera.", "gt-answer": "Sentence A: The cars are traveling slower than the camera.", "video-llm-prediction": "Sentence A: The cars are traveling slower than the camera.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The cars are traveling slower than the camera.\nCaption B: The cars and the camera have the same speed.", "gt-answer": "Caption A: The cars are traveling slower than the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1101200293": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is moving counterclockwise around the aircraft carrier.\nSentence B: The camera is moving clockwise around the aircraft carrier.", "gt-answer": "Sentence B: The camera is moving clockwise around the aircraft carrier.", "video-llm-prediction": "Sentence A: The camera is moving counterclockwise around the aircraft carrier.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera is moving clockwise around the aircraft carrier.\nCaption B: The camera is tilting upwardsaround the aircraft carrier.", "gt-answer": "Caption A: The camera is moving clockwise around the aircraft carrier.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is moving clockwise around the aircraft carrier.\nOption 2: The camera is moving back and forth around the aircraft carrier.", "gt-answer": "Option 1: The camera is moving clockwise around the aircraft carrier.", "video-llm-prediction": "Option 1: The camera is moving clockwise around the aircraft carrier.", "match_success": true, "rating": 1 } ] }, "1072453637": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is panning to the back of a fighter jet.\nSentence B: The camera is panning downwards around a fighter jet.", "gt-answer": "Sentence A: The camera is panning to the back of a fighter jet.", "video-llm-prediction": "Sentence A: The camera is panning to the back of a fighter jet.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning to the back of a fighter jet.\nOption 2: The camera is panning upwards around a fighter jet.", "gt-answer": "Option 1: The camera is panning to the back of a fighter jet.", "video-llm-prediction": "Option 2: The camera is panning upwards around a fighter jet.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera is panning to the back of a fighter jet.\nCaption B: The camera is panning to the front of a fighter jet.", "gt-answer": "Caption A: The camera is panning to the back of a fighter jet.", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The fighter jet first shot one missile, then shot two missiles.\nCaption B: The fighter jet shot three missiles, then shot four missiles.", "gt-answer": "Caption A: The fighter jet first shot one missile, then shot two missiles.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The fighter jet shot two missiles.\nOption 2: The fighter jet first shot one missile, then shot two missiles.", "gt-answer": "Option 2: The fighter jet first shot one missile, then shot two missiles.", "video-llm-prediction": "Option 2: The fighter jet first shot one missile, then shot two missiles.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The fighter jet first shot one missile, then shot two missiles.\nSentence B: The fighter jet shot four missiles, then shot three missiles.", "gt-answer": "Sentence A: The fighter jet first shot one missile, then shot two missiles.", "video-llm-prediction": "Sentence A: The fighter jet first shot one missile, then shot two missiles.", "match_success": true, "rating": 1 } ] }, "3396473605": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The five stars appear from left to right.\nSentence B: The five stars disappear from right to left.", "gt-answer": "Sentence A: The five stars appear from left to right.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The five stars appear from left to right.\nOption 2: The five stars appear from top to bottom.", "gt-answer": "Option 1: The five stars appear from left to right.", "video-llm-prediction": "Option 2: The five stars appear from top to bottom.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The five stars appear from left to right.\nCaption B: The five stars appear from bottom to top.", "gt-answer": "Caption A: The five stars appear from left to right.", "video-llm-prediction": "Caption B: The five stars appear from bottom to top.", "match_success": true, "rating": 0 } ] }, "1086820415": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The large wave is moving horizontally towards the right side of the screen.\nSentence B: The large wave is moving vertically towards the bottom of the screen.", "gt-answer": "Sentence B: The large wave is moving vertically towards the bottom of the screen.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The large wave is moving vertically towards the top of the screen.\nOption 2: The large wave is moving vertically towards the bottom of the screen.", "gt-answer": "Option 2: The large wave is moving vertically towards the bottom of the screen.", "video-llm-prediction": "Option 1: The large wave is moving vertically towards the top of the screen.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The large wave is moving vertically towards the bottom of the screen.\nCaption B: The large wave is moving diagonally towards the top-left corner.", "gt-answer": "Caption A: The large wave is moving vertically towards the bottom of the screen.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1081513610": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A man in the video is discussing something.\nOption 2: The man in the video is swimming.", "gt-answer": "Option 1: A man in the video is discussing something.", "video-llm-prediction": "Option 1: A man in the video is discussing something.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A man in the video is discussing something.\nCaption B: The man in the video is sleeping.", "gt-answer": "Caption A: A man in the video is discussing something.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man in the video is running.\nSentence B: A man in the video is discussing something.", "gt-answer": "Sentence B: A man in the video is discussing something.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1073831006": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Zebras are running.\nSentence B: Zebras are swimming.", "gt-answer": "Sentence A: Zebras are running.", "video-llm-prediction": "Sentence A: Zebras are running.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Zebras are sleeping.\nCaption B: Zebras are running.", "gt-answer": "Caption B: Zebras are running.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Zebras are walking.\nOption 2: Zebras are running.", "gt-answer": "Option 2: Zebras are running.", "video-llm-prediction": "Option 2: Zebras are running.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The zebras are moving from right to left.\nCaption B: The zebras are moving from left to right.", "gt-answer": "Caption B: The zebras are moving from left to right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The zebras are moving from left to right.\nOption 2: The zebras are moving from top to bottom.", "gt-answer": "Option 1: The zebras are moving from left to right.", "video-llm-prediction": "Option 1: The zebras are moving from left to right.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The zebras are moving away from the camera.\nSentence B: The zebras are moving from left to right.", "gt-answer": "Sentence B: The zebras are moving from left to right.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video shows zebras moving in slow motion.\nSentence B: The zebras are stationary.", "gt-answer": "Sentence A: The video shows zebras moving in slow motion.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video shows zebras moving in slow motion.\nCaption B: The video is playing at normal speed.", "gt-answer": "Caption A: The video shows zebras moving in slow motion.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video shows zebras moving in slow motion.\nOption 2: The video is playing in time-lapse.", "gt-answer": "Option 1: The video shows zebras moving in slow motion.", "video-llm-prediction": "Option 1: The video shows zebras moving in slow motion.", "match_success": true, "rating": 1 } ] }, "1069338034": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The elephants are sleeping and resting.\nSentence B: The elephants are eating and drinking in the video.", "gt-answer": "Sentence B: The elephants are eating and drinking in the video.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The elephants are eating and drinking in the video.\nCaption B: They are swimming and taking a bath in the video.", "gt-answer": "Caption A: The elephants are eating and drinking in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The elephants are eating and drinking in the video.\nOption 2: The elephants are eating and playing.", "gt-answer": "Option 1: The elephants are eating and drinking in the video.", "video-llm-prediction": "Option 1: The elephants are eating and drinking in the video.", "match_success": true, "rating": 1 } ] }, "1076880707": { "action": [ { "question": "Which caption matches the video better?\nCaption A: A bear is eating honey near the tree.\nCaption B: A bear is scratching against a tree.", "gt-answer": "Caption B: A bear is scratching against a tree.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The bear is climbing a tree.\nSentence B: A bear is scratching against a tree.", "gt-answer": "Sentence B: A bear is scratching against a tree.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A bear is scratching against a tree.\nOption 2: The bear is taking a nap under the tree.", "gt-answer": "Option 1: A bear is scratching against a tree.", "video-llm-prediction": "Option 1: A bear is scratching against a tree.", "match_success": true, "rating": 1 } ] }, "1092278063": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The two rows of duck toy are moving in the same direction on a conveyor belt.\nSentence B: The two rows of duck toy are moving in opposite directions on a conveyor belt.", "gt-answer": "Sentence B: The two rows of duck toy are moving in opposite directions on a conveyor belt.", "video-llm-prediction": "Sentence A: The two rows of duck toy are moving in the same direction on a conveyor belt.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The two rows of duck toy are moving in opposite directions on a conveyor belt.\nOption 2: The two rows of duck toy are not moving on a conveyor belt.", "gt-answer": "Option 1: The two rows of duck toy are moving in opposite directions on a conveyor belt.", "video-llm-prediction": "Option 1: The two rows of duck toy are moving in opposite directions on a conveyor belt.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The movement pattern of the two rows of duck toy on a conveyor belt is circular motion.\nCaption B: The two rows of duck toy are moving in opposite directions on a conveyor belt.", "gt-answer": "Caption B: The two rows of duck toy are moving in opposite directions on a conveyor belt.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The conveyor belt is moving at a super fast speed.\nOption 2: The speed of the conveyor belt is normal.", "gt-answer": "Option 2: The speed of the conveyor belt is normal.", "video-llm-prediction": "Option 1: The conveyor belt is moving at a super fast speed.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The conveyor belt is stopped.\nCaption B: The speed of the conveyor belt is normal.", "gt-answer": "Caption B: The speed of the conveyor belt is normal.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the conveyor belt is normal.\nSentence B: The conveyor belt is moving slowly.", "gt-answer": "Sentence A: The speed of the conveyor belt is normal.", "video-llm-prediction": "Sentence B: The conveyor belt is moving slowly.", "match_success": true, "rating": 0 } ] }, "1024867412": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The dog is sleeping.\nCaption B: The dog is driving a car.", "gt-answer": "Caption B: The dog is driving a car.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A dog is driving a car.\nOption 2: A video showing a dog eating.", "gt-answer": "Option 1: A dog is driving a car.", "video-llm-prediction": "Option 1: A dog is driving a car.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dog is barking.\nSentence B: A dog is driving a car.", "gt-answer": "Sentence B: A dog is driving a car.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The car is taking a right turn.\nCaption B: The car is taking a left turn.", "gt-answer": "Caption A: The car is taking a right turn.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The car is going backward.\nSentence B: The car is taking a right turn.", "gt-answer": "Sentence B: The car is taking a right turn.", "video-llm-prediction": "Sentence A: The car is going backward.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The car is taking a right turn.\nOption 2: The car is moving forward.", "gt-answer": "Option 1: The car is taking a right turn.", "video-llm-prediction": "Option 2: The car is moving forward.", "match_success": true, "rating": 0 } ] }, "1076877854": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The robots are caring for seedlings.\nCaption B: The robots are watering seedlings.", "gt-answer": "Caption A: The robots are caring for seedlings.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The robots are caring for seedlings.\nOption 2: The robots are harvesting crops.", "gt-answer": "Option 1: The robots are caring for seedlings.", "video-llm-prediction": "Option 1: The robots are caring for seedlings.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The robots are plowing the soil.\nSentence B: The robots are caring for seedlings.", "gt-answer": "Sentence B: The robots are caring for seedlings.", "video-llm-prediction": "Sentence B: The robots are caring for seedlings.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The robotic arm is moving to the left side of the screen.\nSentence B: The closest robotic arm is moving to the right side of the screen.", "gt-answer": "Sentence B: The closest robotic arm is moving to the right side of the screen.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The closest robotic arm is moving to the right side of the screen.\nCaption B: The robotic arm is moving away from the camera.", "gt-answer": "Caption A: The closest robotic arm is moving to the right side of the screen.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The robotic arm is rotating.\nOption 2: The closest robotic arm is moving to the right side of the screen.", "gt-answer": "Option 2: The closest robotic arm is moving to the right side of the screen.", "video-llm-prediction": "Option 1: The robotic arm is rotating.", "match_success": true, "rating": 0 } ] }, "1104673225": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is making salad.\nOption 2: The woman is eating salad.", "gt-answer": "Option 2: The woman is eating salad.", "video-llm-prediction": "Option 2: The woman is eating salad.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is wrapping up salad.\nSentence B: The woman is eating salad.", "gt-answer": "Sentence B: The woman is eating salad.", "video-llm-prediction": "Sentence A: The woman is wrapping up salad.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The woman is eating salad.\nCaption B: The woman is throwing away salad.", "gt-answer": "Caption A: The woman is eating salad.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1100468035": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The camera is zooming backward in the video.\nCaption B: The camera is zooming forward in the video.", "gt-answer": "Caption B: The camera is zooming forward in the video.", "video-llm-prediction": "Caption B: The camera is zooming forward in the video.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming forward in the video.\nSentence B: The camera is tracking right.", "gt-answer": "Sentence A: The camera is zooming forward in the video.", "video-llm-prediction": "Sentence A: The camera is zooming forward in the video.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning left.\nOption 2: The camera is zooming forward in the video.", "gt-answer": "Option 2: The camera is zooming forward in the video.", "video-llm-prediction": "Option 2: The camera is zooming forward in the video.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The door is gradually closing.\nCaption B: The door is gradually opening.", "gt-answer": "Caption B: The door is gradually opening.", "video-llm-prediction": "Caption B: The door is gradually opening.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The door is gradually opening.\nSentence B: The door is remaining closed.", "gt-answer": "Sentence A: The door is gradually opening.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The door is gradually opening.\nOption 2: The door is gradually closing.", "gt-answer": "Option 1: The door is gradually opening.", "video-llm-prediction": "Option 2: The door is gradually closing.", "match_success": true, "rating": 0 } ] }, "315784": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The speedometer in the center is moving faster than the one on the left.\nOption 2: The speedometer in the center is moving slower than the one on the left.", "gt-answer": "Option 1: The speedometer in the center is moving faster than the one on the left.", "video-llm-prediction": "Option 1: The speedometer in the center is moving faster than the one on the left.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speedometer in the center is moving faster than the one on the left.\nSentence B: The speedometer in the center is stationary.", "gt-answer": "Sentence A: The speedometer in the center is moving faster than the one on the left.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speedometer in the center is moving at the same speed as the one on the left.\nCaption B: The speedometer in the center is moving faster than the one on the left.", "gt-answer": "Caption B: The speedometer in the center is moving faster than the one on the left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "3411806181": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is cleaning an electric vehicle.\nSentence B: A person is recharging an electric vehicle.", "gt-answer": "Sentence B: A person is recharging an electric vehicle.", "video-llm-prediction": "Sentence B: A person is recharging an electric vehicle.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A person is recharging an electric vehicle.\nCaption B: A person is repairing an electric vehicle.", "gt-answer": "Caption A: A person is recharging an electric vehicle.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is repairing an EV.\nOption 2: A person is recharging an electric vehicle.", "gt-answer": "Option 2: A person is recharging an electric vehicle.", "video-llm-prediction": "Option 2: A person is recharging an electric vehicle.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The person is unplugging the charging gun from the car.\nOption 2: The person is plugging the charging gun into the car.", "gt-answer": "Option 2: The person is plugging the charging gun into the car.", "video-llm-prediction": "Option 1: The person is unplugging the charging gun from the car.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is moving the charging gun away from the car.\nSentence B: The person is plugging the charging gun into the car.", "gt-answer": "Sentence B: The person is plugging the charging gun into the car.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person is holding the charging gun still.\nCaption B: The person is plugging the charging gun into the car.", "gt-answer": "Caption B: The person is plugging the charging gun into the car.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing in fast motion.\nOption 2: The video is playing in slow motion.", "gt-answer": "Option 2: The video is playing in slow motion.", "video-llm-prediction": "Option 2: The video is playing in slow motion.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing in slow motion.\nSentence B: The video is playing at normal speed.", "gt-answer": "Sentence A: The video is playing in slow motion.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video is time-lapse.\nCaption B: The video is playing in slow motion.", "gt-answer": "Caption B: The video is playing in slow motion.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1043054206": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The yellow car is driving slower than other cars.\nSentence B: The yellow car is driving faster than other cars.", "gt-answer": "Sentence B: The yellow car is driving faster than other cars.", "video-llm-prediction": "Sentence B: The yellow car is driving faster than other cars.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The yellow car is driving faster than other cars.\nCaption B: The yellow car is currently not in motion.", "gt-answer": "Caption A: The yellow car is driving faster than other cars.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The yellow car is traveling at an equivalent speed to other cars.\nOption 2: The yellow car is driving faster than other cars.", "gt-answer": "Option 2: The yellow car is driving faster than other cars.", "video-llm-prediction": "Option 2: The yellow car is driving faster than other cars.", "match_success": true, "rating": 1 } ] }, "1096238125": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The man and woman are lifting weights.\nCaption B: The man and woman are doing sit-ups.", "gt-answer": "Caption A: The man and woman are lifting weights.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man and woman are lifting weights.\nSentence B: The man and woman are jumping rope.", "gt-answer": "Sentence A: The man and woman are lifting weights.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man and woman are lifting weights.\nOption 2: The man and woman are doing push-ups.", "gt-answer": "Option 1: The man and woman are lifting weights.", "video-llm-prediction": "Option 1: The man and woman are lifting weights.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which caption matches the video better?\nCaption A: The man is lifting the kettlebell at roughly the same speed as the woman.\nCaption B: The man is lifting the kettlebell at a much slower speed than the woman.", "gt-answer": "Caption A: The man is lifting the kettlebell at roughly the same speed as the woman.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is lifting the kettlebell at roughly the same speed as the woman.\nOption 2: The man is lifting the kettlebell faster than the woman.", "gt-answer": "Option 1: The man is lifting the kettlebell at roughly the same speed as the woman.", "video-llm-prediction": "Option 1: The man is lifting the kettlebell at roughly the same speed as the woman.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is significantly faster in lifting the kettlebell compared to the woman.\nSentence B: The man is lifting the kettlebell at roughly the same speed as the woman.", "gt-answer": "Sentence B: The man is lifting the kettlebell at roughly the same speed as the woman.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1103088481": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is selling vegetables at the grocery store.\nSentence B: A person is buying vegetables at the grocery store.", "gt-answer": "Sentence B: A person is buying vegetables at the grocery store.", "video-llm-prediction": "Sentence B: A person is buying vegetables at the grocery store.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A person is buying vegetables at the market/grocery store.\nCaption B: The person is packaging vegetables at the market/grocery store.", "gt-answer": "Caption A: A person is buying vegetables at the market/grocery store.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person is buying vegetables at the market/grocery store.\nOption 2: The person is cooking vegetables at the market/grocery store.", "gt-answer": "Option 1: A person is buying vegetables at the market/grocery store.", "video-llm-prediction": "Option 1: A person is buying vegetables at the market/grocery store.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: First, a black vegetable is being placed in the trolley and then a green vegetable.\nSentence B: First, a green vegetable is being placed in the trolley and then a black vegetable.", "gt-answer": "Sentence B: First, a green vegetable is being placed in the trolley and then a black vegetable.", "video-llm-prediction": "Sentence B: First, a green vegetable is being placed in the trolley and then a black vegetable.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Place a green vegetable into the trolley and then place a black vegetable into the trolley.\nCaption B: Place a black vegetable into the trolley and then place a green vegetable into the trolley.", "gt-answer": "Caption A: Place a green vegetable into the trolley and then place a black vegetable into the trolley.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The correct order of events in the video is to place a green vegetable into the trolley and then place a black vegetable into the trolley.\nOption 2: Only a green vegetable is being placed.", "gt-answer": "Option 1: The correct order of events in the video is to place a green vegetable into the trolley and then place a black vegetable into the trolley.", "video-llm-prediction": "Option 1: The correct order of events in the video is to place a green vegetable into the trolley and then place a black vegetable into the trolley.", "match_success": true, "rating": 1 } ] }, "1055981522": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The 3d shapes are transforming from cubes into spheres.\nCaption B: The 3d shapes are transforming from spheres into cubes.", "gt-answer": "Caption A: The 3d shapes are transforming from cubes into spheres.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3d shapes are transforming from spheres into cubes.\nOption 2: The 3d shapes are transforming from cubes into spheres.", "gt-answer": "Option 2: The 3d shapes are transforming from cubes into spheres.", "video-llm-prediction": "Option 1: The 3d shapes are transforming from spheres into cubes.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3d shapes are transforming from cubes into spheres.\nSentence B: The 3d shapes are transforming from spheres into cubes.", "gt-answer": "Sentence A: The 3d shapes are transforming from cubes into spheres.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1061017846": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The boat on the top of the screen is moving faster than the boat on the bottom of the screen.\nSentence B: The boat on the top of the screen travels at the same speed as the boat on the bottom of the screen.", "gt-answer": "Sentence B: The boat on the top of the screen travels at the same speed as the boat on the bottom of the screen.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The boat on the top of the screen is moving slower than the boat on the bottom of the screen.\nOption 2: The boat on the top of the screen travels at the same speed as the boat on the bottom of the screen.", "gt-answer": "Option 2: The boat on the top of the screen travels at the same speed as the boat on the bottom of the screen.", "video-llm-prediction": "Option 1: The boat on the top of the screen is moving slower than the boat on the bottom of the screen.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The boat on the top of the screen travels at the same speed as the boat on the bottom of the screen.\nCaption B: No, the boat on the top of the screen is not moving at the same speed.", "gt-answer": "Caption A: The boat on the top of the screen travels at the same speed as the boat on the bottom of the screen.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1097341567": { "order": [ { "question": "Which caption matches the video better?\nCaption A: First, the bars appear, then the arrow appears.\nCaption B: First, the arrow appears, then the bars appear.", "gt-answer": "Caption A: First, the bars appear, then the arrow appears.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The bars and the arrow appear at the same time.\nOption 2: First, the bars appear, then the arrow appears.", "gt-answer": "Option 2: First, the bars appear, then the arrow appears.", "video-llm-prediction": "Option 2: The bars and the arrow appear at the same time.", "match_success": false, "chatgpt-response": "Incorrect", "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: First, the bars appear, then the arrow appears.\nSentence B: Only the arrow appears in the video.", "gt-answer": "Sentence A: First, the bars appear, then the arrow appears.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1056433484": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The Earth moves around the Sun in a counter-clockwise direction.\nSentence B: The Earth moves around the Sun in a clockwise direction.", "gt-answer": "Sentence A: The Earth moves around the Sun in a counter-clockwise direction.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The Earth moves around the Sun in a counter-clockwise direction.\nCaption B: The Earth travels upwards in its orbit around the Sun.", "gt-answer": "Caption A: The Earth moves around the Sun in a counter-clockwise direction.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The Earth moves around the Sun in a counter-clockwise direction.\nOption 2: The Earth travels from vertically in its orbit around the Sun.", "gt-answer": "Option 1: The Earth moves around the Sun in a counter-clockwise direction.", "video-llm-prediction": "Option 1: The Earth moves around the Sun in a counter-clockwise direction.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The earth rotates slower than the sun.\nOption 2: The earth rotates faster than the sun.", "gt-answer": "Option 2: The earth rotates faster than the sun.", "video-llm-prediction": "Option 2: The earth rotates faster than the sun.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the earth's rotation is faster than the sun.\nSentence B: The earth and sun rotate at equal speeds.", "gt-answer": "Sentence A: The speed of the earth's rotation is faster than the sun.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the earth's rotation is faster than the sun.\nCaption B: The sun rotates faster than the earth.", "gt-answer": "Caption A: The speed of the earth's rotation is faster than the sun.", "video-llm-prediction": "Caption B: The sun rotates faster than the earth.", "match_success": true, "rating": 0 } ] }, "1073914229": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The trains are moving towards each other.\nSentence B: The trains are moving away from each other.", "gt-answer": "Sentence A: The trains are moving towards each other.", "video-llm-prediction": "Sentence A: The trains are moving towards each other.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The trains are moving away from each other.\nOption 2: The trains are moving towards each other.", "gt-answer": "Option 2: The trains are moving towards each other.", "video-llm-prediction": "Option 1: The trains are moving away from each other.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The trains are moving towards each other.\nCaption B: The trains are moving away from each other.", "gt-answer": "Caption A: The trains are moving towards each other.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1099360359": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The train closer to the screen drives faster.\nSentence B: The train further away from the screen drives faster.", "gt-answer": "Sentence B: The train further away from the screen drives faster.", "video-llm-prediction": "Sentence B: The train further away from the screen drives faster.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The train further away from the screen drives faster.\nCaption B: The train further away from the screen drives slower.", "gt-answer": "Caption A: The train further away from the screen drives faster.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The two trains drive at the same speed.\nOption 2: The train further away from the screen drives faster.", "gt-answer": "Option 2: The train further away from the screen drives faster.", "video-llm-prediction": "Option 2: The train further away from the screen drives faster.", "match_success": true, "rating": 1 } ] }, "1098970151": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The cat is licking its paw.\nOption 2: The cat is waving its paw.", "gt-answer": "Option 1: The cat is licking its paw.", "video-llm-prediction": "Option 1: The cat is licking its paw.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The cat is licking its paw.\nSentence B: The cat is biting its paw.", "gt-answer": "Sentence A: The cat is licking its paw.", "video-llm-prediction": "Sentence A: The cat is licking its paw.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The cat is licking its paw.\nCaption B: The cat is licking its belly.", "gt-answer": "Caption A: The cat is licking its paw.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1081734740": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The leaf is turning from green to yellow.\nOption 2: The leaf is turning from yellow to green.", "gt-answer": "Option 1: The leaf is turning from green to yellow.", "video-llm-prediction": "Option 1: The leaf is turning from green to yellow.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The texture of the leaf is turning from green to yellow.\nCaption B: The leaf is turning from green to white.", "gt-answer": "Caption A: The texture of the leaf is turning from green to yellow.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The texture of the leaf is turning from yellow to green.\nSentence B: The texture of the leaf is turning from green to yellow.", "gt-answer": "Sentence B: The texture of the leaf is turning from green to yellow.", "video-llm-prediction": "Sentence A: The texture of the leaf is turning from yellow to green.", "match_success": true, "rating": 0 } ] }, "1093719871": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The pink flowers are turning from full blossom to withered.\nSentence B: The pink flowers are turning from withered to full blossom.", "gt-answer": "Sentence B: The pink flowers are turning from withered to full blossom.", "video-llm-prediction": "Sentence A: The pink flowers are turning from full blossom to withered.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pink flowers are growing taller.\nOption 2: The pink flowers are turning from withered to full blossom.", "gt-answer": "Option 2: The pink flowers are turning from withered to full blossom.", "video-llm-prediction": "Option 2: The pink flowers are turning from withered to full blossom.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The pink flowers are falling off petals.\nCaption B: The pink flowers are turning from withered to full blossom.", "gt-answer": "Caption B: The pink flowers are turning from withered to full blossom.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1042819039": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is playing in slow motion.\nOption 2: The video is playing in time-lapse.", "gt-answer": "Option 2: The video is playing in time-lapse.", "video-llm-prediction": "Option 1: The video is playing in slow motion.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is playing in time-lapse.\nSentence B: The video is playing at normal speed.", "gt-answer": "Sentence A: The video is playing in time-lapse.", "video-llm-prediction": "Sentence A: The video is playing in time-lapse.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is playing in time-lapse.\nCaption B: The video is playing in slow motion.", "gt-answer": "Caption A: The video is playing in time-lapse.", "video-llm-prediction": "Caption B: The video is playing in slow motion.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The street was filled with people, then it was filled with vehicles.\nOption 2: The street was filled with vehicles, then it was filled with people.", "gt-answer": "Option 1: The street was filled with people, then it was filled with vehicles.", "video-llm-prediction": "Option 2: The street was filled with vehicles, then it was filled with people.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The street was filled with vehicles, then it was filled with people.\nCaption B: The street was filled with people, then it was filled with vehicles.", "gt-answer": "Caption B: The street was filled with people, then it was filled with vehicles.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The street was filled with people, then it was filled with vehicles.\nSentence B: The street was completely empty and then filled with vehicles.", "gt-answer": "Sentence A: The street was filled with people, then it was filled with vehicles.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1093139559": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming out from three football players.\nSentence B: The camera is zooming into three football players.", "gt-answer": "Sentence B: The camera is zooming into three football players.", "video-llm-prediction": "Sentence A: The camera is zooming out from three football players.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera is zooming into three football players.\nCaption B: The camera is panning left.", "gt-answer": "Caption A: The camera is zooming into three football players.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is zooming into three football players.\nOption 2: The camera is panning right.", "gt-answer": "Option 1: The camera is zooming into three football players.", "video-llm-prediction": "Option 1: The camera is zooming into three football players.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The light on the football players is turning brighter.\nOption 2: The light on the football players is turning darker.", "gt-answer": "Option 1: The light on the football players is turning brighter.", "video-llm-prediction": "Option 2: The light on the football players is turning darker.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The light on the football players is staying the same.\nCaption B: The light on the football players is turning brighter.", "gt-answer": "Caption B: The light on the football players is turning brighter.", "video-llm-prediction": "Caption B: The light on the football players is turning brighter.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The light on the football players is dimming.\nSentence B: The light on the football players is turning brighter.", "gt-answer": "Sentence B: The light on the football players is turning brighter.", "video-llm-prediction": "Sentence B: The light on the football players is turning brighter.", "match_success": true, "rating": 1 } ] }, "1055973887": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The fire ball is getting smaller.\nOption 2: The fire ball is getting larger.", "gt-answer": "Option 2: The fire ball is getting larger.", "video-llm-prediction": "Option 2: The fire ball is getting larger.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The fire ball is shrinking in size.\nSentence B: The fire ball is getting larger.", "gt-answer": "Sentence B: The fire ball is getting larger.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The fire ball is getting larger.\nCaption B: The fire ball is getting smaller.", "gt-answer": "Caption A: The fire ball is getting larger.", "video-llm-prediction": "Caption A: The fire ball is getting larger.", "match_success": true, "rating": 1 } ] }, "1098710341": { "action": [ { "question": "Which caption matches the video better?\nCaption A: A person is pouring water into a glass.\nCaption B: A person is drinking water from a glass.", "gt-answer": "Caption A: A person is pouring water into a glass.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is pouring water into a glass.\nSentence B: The person is washing hands with water.", "gt-answer": "Sentence A: A person is pouring water into a glass.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Water is being spilled on the floor.\nOption 2: A person is pouring water into a glass.", "gt-answer": "Option 2: A person is pouring water into a glass.", "video-llm-prediction": "Option 2: A person is pouring water into a glass.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The glass is going from empty to full of water.\nOption 2: The glass is going from full of water to empty.", "gt-answer": "Option 1: The glass is going from empty to full of water.", "video-llm-prediction": "Option 1: The glass is going from empty to full of water.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The glass is going from full of water to empty.\nSentence B: The glass is going from empty to full of water.", "gt-answer": "Sentence B: The glass is going from empty to full of water.", "video-llm-prediction": "Sentence A: The glass is going from full of water to empty.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The glass is going from empty to full of water.\nCaption B: The glass is going from full of water to empty.", "gt-answer": "Caption A: The glass is going from empty to full of water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1062736174": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The chef is chopping steak.\nCaption B: The chef is sprinkling salt on the steak.", "gt-answer": "Caption B: The chef is sprinkling salt on the steak.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The chef is sprinkling vegetables on the steak.\nSentence B: The chef is sprinkling salt on the steak.", "gt-answer": "Sentence B: The chef is sprinkling salt on the steak.", "video-llm-prediction": "Sentence B: The chef is sprinkling salt on the steak.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The chef is sprinkling salt on the steak.\nOption 2: The chef is grilling steak.", "gt-answer": "Option 1: The chef is sprinkling salt on the steak.", "video-llm-prediction": "Option 1: The chef is sprinkling salt on the steak.", "match_success": true, "rating": 1 } ] }, "1099116143": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: White foam appears on the surface of the pink liquid.\nCaption B: White foam disappears from the surface of the pink liquid.", "gt-answer": "Caption A: White foam appears on the surface of the pink liquid.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pink liquid is freezing.\nOption 2: White foam appears on the surface of the pink liquid.", "gt-answer": "Option 2: White foam appears on the surface of the pink liquid.", "video-llm-prediction": "Option 2: White foam appears on the surface of the pink liquid.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: White foam appears on the surface of the pink liquid.\nSentence B: The pink liquid is evaporating.", "gt-answer": "Sentence A: White foam appears on the surface of the pink liquid.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1108398787": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The person is watching videos on a smartphone device.\nOption 2: The person is operating system settings on a smartphone device.", "gt-answer": "Option 2: The person is operating system settings on a smartphone device.", "video-llm-prediction": "Option 1: The person is watching videos on a smartphone device.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person is making a phone call using a smartphone device.\nCaption B: The person is operating system settings on a smartphone device.", "gt-answer": "Caption B: The person is operating system settings on a smartphone device.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is operating system settings on a smartphone device.\nSentence B: The person is chatting on a smartphone device.", "gt-answer": "Sentence A: The person is operating system settings on a smartphone device.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The person is scrolling down and then entering passwords.\nCaption B: The person is entering passwords and then scrolling down.", "gt-answer": "Caption A: The person is scrolling down and then entering passwords.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is scrolling down and then entering passwords.\nSentence B: The person is entering passwords and then scrolling up.", "gt-answer": "Sentence A: The person is scrolling down and then entering passwords.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is scrolling down and then entering passwords.\nOption 2: The person is scrolling up and then entering passwords.", "gt-answer": "Option 1: The person is scrolling down and then entering passwords.", "video-llm-prediction": "Option 1: The person is scrolling down and then entering passwords.", "match_success": true, "rating": 1 } ] }, "1080591311": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The jellyfish is floating downwards.\nCaption B: The jellyfish is floating upwards.", "gt-answer": "Caption B: The jellyfish is floating upwards.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The jellyfish is moving towards the right.\nSentence B: The jellyfish is floating upwards.", "gt-answer": "Sentence B: The jellyfish is floating upwards.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The jellyfish is sinking downwards.\nOption 2: The jellyfish is floating upwards.", "gt-answer": "Option 2: The jellyfish is floating upwards.", "video-llm-prediction": "Option 1: The jellyfish is sinking downwards.", "match_success": true, "rating": 0 } ] }, "1107034223": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The bear is catching fishes in the river.\nOption 2: The bear is swallowing fishes in the river.", "gt-answer": "Option 1: The bear is catching fishes in the river.", "video-llm-prediction": "Option 2: The bear is swallowing fishes in the river.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The bear is catching fishes in the river.\nCaption B: The bear is climbing trees.", "gt-answer": "Caption A: The bear is catching fishes in the river.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The bear is catching fishes in the river.\nSentence B: The bear is sleeping in the river.", "gt-answer": "Sentence A: The bear is catching fishes in the river.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The bear turned back and then caught a fish.\nOption 2: The bear caught a fish and then turned back.", "gt-answer": "Option 2: The bear caught a fish and then turned back.", "video-llm-prediction": "Option 2: The bear caught a fish and then turned back.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The bear caught a fish and then turned back.\nSentence B: The bear caught a fish and then climbed up a tree.", "gt-answer": "Sentence A: The bear caught a fish and then turned back.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The bear caught a fish and then turned back.\nCaption B: The bear jumped into the water and then caught a fish.", "gt-answer": "Caption A: The bear caught a fish and then turned back.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1025623079": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The skyscraper is growing taller.\nCaption B: The skyscraper is collapsing.", "gt-answer": "Caption B: The skyscraper is collapsing.", "video-llm-prediction": "Caption B: The skyscraper is collapsing.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The skyscraper is growing taller.\nOption 2: The skyscraper is collapsing.", "gt-answer": "Option 2: The skyscraper is collapsing.", "video-llm-prediction": "Option 2: The skyscraper is collapsing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The skyscraper is standing up.\nSentence B: The skyscraper is collapsing.", "gt-answer": "Sentence B: The skyscraper is collapsing.", "video-llm-prediction": "Sentence B: The skyscraper is collapsing.", "match_success": true, "rating": 1 } ] }, "1094782389": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The dog is running towards a woman.\nCaption B: The dog is giving a high five to a woman.", "gt-answer": "Caption B: The dog is giving a high five to a woman.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dog is barking to a woman.\nSentence B: The dog is giving a high five to a woman.", "gt-answer": "Sentence B: The dog is giving a high five to a woman.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The dog is giving a high five to a woman.\nOption 2: The dog is catching food from a woman.", "gt-answer": "Option 1: The dog is giving a high five to a woman.", "video-llm-prediction": "Option 1: The dog is giving a high five to a woman.", "match_success": true, "rating": 1 } ] }, "3411228673": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is moving upwards along the skyscraper buildings.\nSentence B: The camera is moving downwards along the skyscraper buildings.", "gt-answer": "Sentence A: The camera is moving upwards along the skyscraper buildings.", "video-llm-prediction": "Sentence A: The camera is moving upwards along the skyscraper buildings.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The movement in the video is upwards among skyscraper buildings.\nOption 2: The camera is moving backwards.", "gt-answer": "Option 1: The movement in the video is upwards among skyscraper buildings.", "video-llm-prediction": "Option 1: The movement in the video is upwards among skyscraper buildings.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The movement in the video is upwards among skyscraper buildings.\nCaption B: The camera is moving downwards.", "gt-answer": "Caption A: The movement in the video is upwards among skyscraper buildings.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1043487715": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Children are diving into water.\nOption 2: Children are eating.", "gt-answer": "Option 1: Children are diving into water.", "video-llm-prediction": "Option 1: Children are diving into water.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Children can be seen diving into water in the video.\nSentence B: A group of children is sleeping.", "gt-answer": "Sentence A: Children can be seen diving into water in the video.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Children can be seen diving into water in the video.\nCaption B: The children are hiking.", "gt-answer": "Caption A: Children can be seen diving into water in the video.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The children are diving into water and then making gestures to the camera.\nSentence B: The children are making gestures to the camera and then diving into water.", "gt-answer": "Sentence A: The children are diving into water and then making gestures to the camera.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The children are diving into water after making gestures to the camera.\nCaption B: The children are diving into water and then making gestures to the camera.", "gt-answer": "Caption B: The children are diving into water and then making gestures to the camera.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The children are making gestures to the camera first and then diving into water.\nOption 2: The children are diving into water and then making gestures to the camera.", "gt-answer": "Option 2: The children are diving into water and then making gestures to the camera.", "video-llm-prediction": "Option 1: The children are making gestures to the camera first and then diving into water.", "match_success": true, "rating": 0 } ] }, "1093737353": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is panning to the left.\nSentence B: The camera is panning to the right.", "gt-answer": "Sentence B: The camera is panning to the right.", "video-llm-prediction": "Sentence B: The camera is panning to the right.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The camera is panning to the right.\nCaption B: The camera is tilting up.", "gt-answer": "Caption A: The camera is panning to the right.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning to the right.\nOption 2: The camera is zooming in.", "gt-answer": "Option 1: The camera is panning to the right.", "video-llm-prediction": "Option 2: The camera is zooming in.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video shows a beaker followed by a line of test tubes.\nSentence B: The video shows a line of test tubes followed by a beaker.", "gt-answer": "Sentence B: The video shows a line of test tubes followed by a beaker.", "video-llm-prediction": "Sentence A: The video shows a beaker followed by a line of test tubes.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a microscope and then a beaker are shown.\nOption 2: The video shows a line of test tubes followed by a beaker.", "gt-answer": "Option 2: The video shows a line of test tubes followed by a beaker.", "video-llm-prediction": "Option 1: In the video, a microscope and then a beaker are shown.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video shows a line of test tubes followed by a beaker.\nCaption B: A beaker is shown, followed by a line of test tubes.", "gt-answer": "Caption A: The video shows a line of test tubes followed by a beaker.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1063373449": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The coronavirus is dissolving.\nOption 2: The coronavirus is enlarging.", "gt-answer": "Option 1: The coronavirus is dissolving.", "video-llm-prediction": "Option 2: The coronavirus is enlarging.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The coronavirus is dissolving under the attack of antibodies.\nSentence B: The coronavirus is assembling together.", "gt-answer": "Sentence A: The coronavirus is dissolving under the attack of antibodies.", "video-llm-prediction": "Sentence A: The coronavirus is dissolving under the attack of antibodies.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The coronavirus is dissolving under the attack of antibodies.\nCaption B: The coronavirus is assembling together.", "gt-answer": "Caption A: The coronavirus is dissolving under the attack of antibodies.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1017768724": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The person is moving leftwards.\nOption 2: The person is moving rightwards.", "gt-answer": "Option 2: The person is moving rightwards.", "video-llm-prediction": "Option 2: The person is moving rightwards.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is moving rightwards.\nSentence B: The person is moving upwards.", "gt-answer": "Sentence A: The person is moving rightwards.", "video-llm-prediction": "Sentence A: The person is moving rightwards.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The person is moving downwards.\nCaption B: The person is moving rightwards.", "gt-answer": "Caption B: The person is moving rightwards.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1106280325": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is playing guitar.\nOption 2: The woman is reading a book.", "gt-answer": "Option 2: The woman is reading a book.", "video-llm-prediction": "Option 2: The woman is reading a book.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is reading a book.\nCaption B: The woman is hiking.", "gt-answer": "Caption A: The woman is reading a book.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is reading a book.\nSentence B: The woman is dancing.", "gt-answer": "Sentence A: The woman is reading a book.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A body of water is shown, then a girl is shown reading a book\nOption 2: A girl is shown reading a book, then a body of water is shown.", "gt-answer": "Option 2: A girl is shown reading a book, then a body of water is shown.", "video-llm-prediction": "Option 2: A girl is shown reading a book, then a body of water is shown.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl and the river appear at the same time in the video.\nSentence B: In the video, a girl is shown reading a book, then a body of water is shown.", "gt-answer": "Sentence B: In the video, a girl is shown reading a book, then a body of water is shown.", "video-llm-prediction": "Sentence A: The girl and the river appear at the same time in the video.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video shows a girl reading a book and a body of water simultaneously.\nCaption B: In the video, a girl is shown reading a book, then a body of water is shown.", "gt-answer": "Caption B: In the video, a girl is shown reading a book, then a body of water is shown.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1100117263": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The little lion is jumping onto the back of an adult lion.\nSentence B: The little lion is falling from the back of an adult lion.", "gt-answer": "Sentence B: The little lion is falling from the back of an adult lion.", "video-llm-prediction": "Sentence A: The little lion is jumping onto the back of an adult lion.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The little lion is sitting nearby an adult lion.\nCaption B: The little lion is falling from the back of an adult lion.", "gt-answer": "Caption B: The little lion is falling from the back of an adult lion.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The little lion is falling from the back of an adult lion.\nOption 2: The little lion is sitting on the back of an adult lion.", "gt-answer": "Option 1: The little lion is falling from the back of an adult lion.", "video-llm-prediction": "Option 2: The little lion is sitting on the back of an adult lion.", "match_success": true, "rating": 0 } ] }, "15695290": { "action": [ { "question": "Which caption matches the video better?\nCaption A: A person is drawing a picture.\nCaption B: A person is playing soccer.", "gt-answer": "Caption A: A person is drawing a picture.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is drawing a picture.\nSentence B: The person is reading a book.", "gt-answer": "Sentence A: A person is drawing a picture.", "video-llm-prediction": "A person is drawing a picture.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person is drawing a picture.\nOption 2: The person is dancing.", "gt-answer": "Option 1: A person is drawing a picture.", "video-llm-prediction": "Option 1: A person is drawing a picture.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, first a house is drawn and then a family of people is drawn.\nSentence B: In the video, first a family of people is drawn and then a house is drawn.", "gt-answer": "Sentence A: In the video, first a house is drawn and then a family of people is drawn.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: In the video, first a house is drawn and then a family of people is drawn.\nCaption B: Both events, drawing the house and drawing the family, occur at the same time in the video.", "gt-answer": "Caption A: In the video, first a house is drawn and then a family of people is drawn.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The house being drawn occurs after the family of people is drawn.\nOption 2: In the video, first a house is drawn and then a family of people is drawn.", "gt-answer": "Option 2: In the video, first a house is drawn and then a family of people is drawn.", "video-llm-prediction": "Option 2: In the video, first a house is drawn and then a family of people is drawn.", "match_success": true, "rating": 1 } ] }, "1091090295": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: First, a bird is seen flying onto the back of a hippo. Then, a hippo pokes its head out of water.\nOption 2: First, a hippo pokes its head out of water. Then, a bird is seen flying onto the back of another hippo.", "gt-answer": "Option 1: First, a bird is seen flying onto the back of a hippo. Then, a hippo pokes its head out of water.", "video-llm-prediction": "Option 1", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A hippo puts its head into water before a bird flying onto the back of another hippo.\nSentence B: First, a bird is seen flying onto the back of a hippo. Then, a hippo pokes its head out of water.", "gt-answer": "Sentence B: First, a bird is seen flying onto the back of a hippo. Then, a hippo pokes its head out of water.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: First, a bird is seen flying onto the back of a hippo. Then, a hippo pokes its head out of water.\nCaption B: Simultaneously, a bird flying onto the back of a hippo and another hippo pokes its head out of water.", "gt-answer": "Caption A: First, a bird is seen flying onto the back of a hippo. Then, a hippo pokes its head out of water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1021488277": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is dropping down the pineapple.\nSentence B: A person is picking up the pineapple.", "gt-answer": "Sentence B: A person is picking up the pineapple.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pineapple is being rotated by a person.\nOption 2: A person is picking up the pineapple.", "gt-answer": "Option 2: A person is picking up the pineapple.", "video-llm-prediction": "Option 1: The pineapple is being rotated by a person.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: A person is picking up the pineapple.\nCaption B: The pineapple is being pushed forward by a person.", "gt-answer": "Caption A: A person is picking up the pineapple.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1106899445": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Someone is removing toothpaste from the toothbrush.\nSentence B: The person is squeezing out toothpaste on the toothbrush.", "gt-answer": "Sentence B: The person is squeezing out toothpaste on the toothbrush.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The person is squeezing out toothpaste on the toothbrush.\nCaption B: The person is brushing teeth.", "gt-answer": "Caption A: The person is squeezing out toothpaste on the toothbrush.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is squeezing out toothpaste on the toothbrush.\nOption 2: A video showing a person wiping off toothpaste from the toothbrush.", "gt-answer": "Option 1: The person is squeezing out toothpaste on the toothbrush.", "video-llm-prediction": "Option 1: The person is squeezing out toothpaste on the toothbrush.", "match_success": true, "rating": 1 } ] }, "1067925569": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Firstly, a cargo train is shown, secondly a container ship is shown.\nOption 2: Firstly, a container ship is shown, secondly a cargo train is shown.", "gt-answer": "Option 2: Firstly, a container ship is shown, secondly a cargo train is shown.", "video-llm-prediction": "Option 2: Firstly, a container ship is shown, secondly a cargo train is shown.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The cargo train and the container ship are shown simultaneously.\nSentence B: In the video, first a container ship is shown, then a cargo train is shown.", "gt-answer": "Sentence B: In the video, first a container ship is shown, then a cargo train is shown.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A container ship is shown, then a cargo train is shown.\nCaption B: In the video, first a container ship is shown, then a cargo train is shown.", "gt-answer": "Caption B: In the video, first a container ship is shown, then a cargo train is shown.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1062609286": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The battery charge is decreasing.\nOption 2: The battery charge is increasing.", "gt-answer": "Option 2: The battery charge is increasing.", "video-llm-prediction": "Option 1: The battery charge is decreasing.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The battery charge is staying constant.\nCaption B: The battery charge is increasing.", "gt-answer": "Caption B: The battery charge is increasing.", "video-llm-prediction": "Caption B: The battery charge is increasing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The battery charge is decreasing.\nSentence B: The battery charge is increasing.", "gt-answer": "Sentence B: The battery charge is increasing.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1100397435": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A person is turning off the robot vacuum cleaner.\nOption 2: A person starts the robot vacuum cleaner.", "gt-answer": "Option 2: A person starts the robot vacuum cleaner.", "video-llm-prediction": "Option 2: A person starts the robot vacuum cleaner.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is fixing the robot vacuum cleaner.\nSentence B: A person starts the robot vacuum cleaner.", "gt-answer": "Sentence B: A person starts the robot vacuum cleaner.", "video-llm-prediction": "Sentence A: A person is fixing the robot vacuum cleaner.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: A person starts the robot vacuum cleaner.\nCaption B: A person is sweeping the floor.", "gt-answer": "Caption A: A person starts the robot vacuum cleaner.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The robot vacuum cleaner is moving to the right side of the screen.\nOption 2: The robot vacuum cleaner is moving to the left side of the screen.", "gt-answer": "Option 1: The robot vacuum cleaner is moving to the right side of the screen.", "video-llm-prediction": "Option 1: The robot vacuum cleaner is moving to the right side of the screen.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The robot vacuum cleaner is moving to the right side of the screen.\nCaption B: The robot vacuum cleaner is moving towards the screen.", "gt-answer": "Caption A: The robot vacuum cleaner is moving to the right side of the screen.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The robot vacuum cleaner is moving away from the screen.\nSentence B: The robot vacuum cleaner is moving to the right side of the screen.", "gt-answer": "Sentence B: The robot vacuum cleaner is moving to the right side of the screen.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The robot vacuum cleaner starts moving and then a person enters the screen.\nCaption B: A person enters the screen and then the robot vacuum cleaner starts moving.", "gt-answer": "Caption B: A person enters the screen and then the robot vacuum cleaner starts moving.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person enters the screen and then the robot vacuum cleaner starts moving.\nSentence B: The person starts moving before the robot vacuum cleaner.", "gt-answer": "Sentence A: A person enters the screen and then the robot vacuum cleaner starts moving.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person enters the screen and then the robot vacuum cleaner starts moving.\nOption 2: The robot vacuum cleaner moves first, followed by a person entering the screen.", "gt-answer": "Option 1: A person enters the screen and then the robot vacuum cleaner starts moving.", "video-llm-prediction": "Option 2: The robot vacuum cleaner moves first, followed by a person entering the screen.", "match_success": true, "rating": 0 } ] }, "1108534143": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The puppy is walking into a wigwam.\nOption 2: The puppy is walking out of a wigwam.", "gt-answer": "Option 2: The puppy is walking out of a wigwam.", "video-llm-prediction": "Option 2: The puppy is walking out of a wigwam.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The puppy is staying in a wigwam.\nCaption B: The puppy is walking out of a wigwam.", "gt-answer": "Caption B: The puppy is walking out of a wigwam.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The puppy is walking out of a wigwam.\nSentence B: The puppy is walking around a wigwam.", "gt-answer": "Sentence A: The puppy is walking out of a wigwam.", "video-llm-prediction": "Sentence A: The puppy is walking out of a wigwam.", "match_success": true, "rating": 1 } ] }, "1034049020": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A woman is painting a wall while walking in the video.\nSentence B: A woman is painting a wall while standing still in the video.", "gt-answer": "Sentence A: A woman is painting a wall while walking in the video.", "video-llm-prediction": "Sentence A: A woman is painting a wall while walking in the video.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A girl is walking and cleaning a wall.\nCaption B: A woman is painting a wall while walking in the video.", "gt-answer": "Caption B: A woman is painting a wall while walking in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A woman is painting a wall while walking in the video.\nOption 2: A girl painting a wall.", "gt-answer": "Option 1: A woman is painting a wall while walking in the video.", "video-llm-prediction": "Option 1: A woman is painting a wall while walking in the video.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The woman is turning back and then painting a wall while walking.\nCaption B: The woman is painting a wall while walking and then turning back.", "gt-answer": "Caption B: The woman is painting a wall while walking and then turning back.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The events are occurring in the order of painting a wall while walking, then turning back.\nOption 2: The order of events is turning back and painting the wall, then walking.", "gt-answer": "Option 1: The events are occurring in the order of painting a wall while walking, then turning back.", "video-llm-prediction": "Option 1: The events are occurring in the order of painting a wall while walking, then turning back.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The events are occurring in the order of painting a wall while walking, then turning back.\nSentence B: The events are happening in the order of turning back, then painting a wall while walking.", "gt-answer": "Sentence A: The events are occurring in the order of painting a wall while walking, then turning back.", "video-llm-prediction": "Sentence A: The events are occurring in the order of painting a wall while walking, then turning back.", "match_success": true, "rating": 1 } ] }, "1047368344": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl is jumping into the water.\nSentence B: The girl is jumping out of water.", "gt-answer": "Sentence A: The girl is jumping into the water.", "video-llm-prediction": "Sentence A: The girl is jumping into the water.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The girl is jumping around water.\nCaption B: The girl is jumping into the water.", "gt-answer": "Caption B: The girl is jumping into the water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The girl is swimming in the water.\nOption 2: The girl is jumping into the water.", "gt-answer": "Option 2: The girl is jumping into the water.", "video-llm-prediction": "Option 2: The girl is jumping into the water.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl first jumps into the water and then takes off her clothes.\nSentence B: The girl first takes off her clothes and then jumps into the water.", "gt-answer": "Sentence B: The girl first takes off her clothes and then jumps into the water.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The girl first takes off her clothes and then jumps into the water.\nCaption B: After jumping into the water, the girl takes off her clothes.", "gt-answer": "Caption A: The girl first takes off her clothes and then jumps into the water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The girl first takes off her clothes and then jumps into the water.\nOption 2: The girl puts on her clothes after jumping into the water.", "gt-answer": "Option 1: The girl first takes off her clothes and then jumps into the water.", "video-llm-prediction": "Option 2: The girl puts on her clothes after jumping into the water.", "match_success": true, "rating": 0 } ] }, "1060403198": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The tree is decreasing in height.\nSentence B: The tree is increasing in height.", "gt-answer": "Sentence B: The tree is increasing in height.", "video-llm-prediction": "Sentence A: The tree is decreasing in height.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The tree is growing taller.\nCaption B: The tree is becoming shorter.", "gt-answer": "Caption A: The tree is growing taller.", "video-llm-prediction": "Caption A: The tree is growing taller.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The tree is decreasing in height.\nOption 2: The tree is increasing in height.", "gt-answer": "Option 2: The tree is increasing in height.", "video-llm-prediction": "Option 1: The tree is decreasing in height.", "match_success": true, "rating": 0 } ] }, "1100074677": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person wrote something on the paper note and then stood the paper note up.\nSentence B: The person stood the paper note up and then wrote something on the paper note.", "gt-answer": "Sentence A: The person wrote something on the paper note and then stood the paper note up.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The person wrote something on the paper note and then stood the paper note up.\nCaption B: The person wrote something on the paper note and then tore it apart.", "gt-answer": "Caption A: The person wrote something on the paper note and then stood the paper note up.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person wrote something on the paper note and then stood the paper note up.\nOption 2: The person threw the paper note away and then tore it apart.", "gt-answer": "Option 1: The person wrote something on the paper note and then stood the paper note up.", "video-llm-prediction": "Option 1: The person wrote something on the paper note and then stood the paper note up.", "match_success": true, "rating": 1 } ] }, "1100350201": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The little girl is drawn first, then the man is drawn.\nCaption B: The man is drawn first, then the little girl disappears.", "gt-answer": "Caption A: The little girl is drawn first, then the man is drawn.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is drawn and then the little girl appears.\nOption 2: The little girl is drawn first, then the man is drawn.", "gt-answer": "Option 2: The little girl is drawn first, then the man is drawn.", "video-llm-prediction": "Option 2: The little girl is drawn first, then the man is drawn.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The little girl is drawn first, then the man is drawn.\nSentence B: The little girl is drawn and then the man gets erased and drawn.", "gt-answer": "Sentence A: The little girl is drawn first, then the man is drawn.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1099109715": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The number of fruits and vegetables is increasing.\nOption 2: The number of fruits and vegetables is decreasing.", "gt-answer": "Option 1: The number of fruits and vegetables is increasing.", "video-llm-prediction": "Option 1: The number of fruits and vegetables is increasing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The number of fruits and vegetables is increasing.\nSentence B: The fruits and vegetables are becoming rotten.", "gt-answer": "Sentence A: The number of fruits and vegetables is increasing.", "video-llm-prediction": "Sentence A: The number of fruits and vegetables is increasing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The number of fruits and vegetables is increasing.\nCaption B: The fruits and vegetables are staying the same.", "gt-answer": "Caption A: The number of fruits and vegetables is increasing.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1051211272": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The toast with cream cheese is gradually growing larger.\nSentence B: The toast with cream cheese is gradually being eaten out and disappearing.", "gt-answer": "Sentence B: The toast with cream cheese is gradually being eaten out and disappearing.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The toast with cream cheese is gradually being eaten out and disappearing.\nOption 2: The toast with cream cheese is gradually emerging piece by piece.", "gt-answer": "Option 1: The toast with cream cheese is gradually being eaten out and disappearing.", "video-llm-prediction": "Option 1: The toast with cream cheese is gradually being eaten out and disappearing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The toast with cream cheese is gradually growing larger.\nCaption B: The toast with cream cheese is gradually being eaten out and disappearing.", "gt-answer": "Caption B: The toast with cream cheese is gradually being eaten out and disappearing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1059815936": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The paper is changing from a wrinkled paper ball into a flattened sheet.\nSentence B: The paper is changing from a flattened sheet into a wrinkled paper ball.", "gt-answer": "Sentence A: The paper is changing from a wrinkled paper ball into a flattened sheet.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The paper is changing from a wrinkled paper ball into a flattened sheet.\nCaption B: The paper is disappearing.", "gt-answer": "Caption A: The paper is changing from a wrinkled paper ball into a flattened sheet.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The paper is changing from a wrinkled paper ball into a flattened sheet.\nOption 2: The paper is tearing apart.", "gt-answer": "Option 1: The paper is changing from a wrinkled paper ball into a flattened sheet.", "video-llm-prediction": "Option 1: The paper is changing from a wrinkled paper ball into a flattened sheet.", "match_success": true, "rating": 1 } ] }, "1086423566": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The bowl rotates and then food is added into the bowl.\nOption 2: Food is added into the bowl and then the bowl rotates.", "gt-answer": "Option 2: Food is added into the bowl and then the bowl rotates.", "video-llm-prediction": "Option 2: Food is added into the bowl and then the bowl rotates.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: In the video, food is added into the bowl first and then the bowl rotates.\nCaption B: The bowl flips upside down and then food is added into the bowl.", "gt-answer": "Caption A: In the video, food is added into the bowl first and then the bowl rotates.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Food is added into the bowl and then it disappears.\nSentence B: In the video, food is added into the bowl first and then the bowl rotates.", "gt-answer": "Sentence B: In the video, food is added into the bowl first and then the bowl rotates.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1069611487": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: First, pizza slices being taken away and then a paper box appears.\nSentence B: First, a paper box appears and then pizza slices being taken away.", "gt-answer": "Sentence B: First, a paper box appears and then pizza slices being taken away.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A pizza slice disappears before a paper box appears.\nOption 2: First, a paper box appears and then pizza slices disappear.", "gt-answer": "Option 2: First, a paper box appears and then pizza slices disappear.", "video-llm-prediction": "Option 2: First, a paper box appears and then pizza slices disappear.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: In the video, a paper box disappears before the pizza slices disappear.\nCaption B: First, a paper box appears and then pizza slices disappear.", "gt-answer": "Caption B: First, a paper box appears and then pizza slices disappear.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1083845854_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The clock hands are moving clockwise.\nOption 2: The clock hands are moving counterclockwise.", "gt-answer": "Option 2: The clock hands are moving counterclockwise.", "video-llm-prediction": "Option 1: The clock hands are moving clockwise.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The clock hands are moving counterclockwise.\nSentence B: The clock hands are moving clockwise.", "gt-answer": "Sentence A: The clock hands are moving counterclockwise.", "video-llm-prediction": "Sentence A: The clock hands are moving counterclockwise.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The clock hands are rotating counterclockwise.\nCaption B: The clock hands are rotating clockwise.", "gt-answer": "Caption A: The clock hands are rotating counterclockwise.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1100329207_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The camera view is moving right.\nOption 2: The camera view is moving backward.", "gt-answer": "Option 2: The camera view is moving backward.", "video-llm-prediction": "Option 1: The camera view is moving right.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera view is moving forward.\nCaption B: The camera view is moving backward.", "gt-answer": "Caption B: The camera view is moving backward.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera view is moving backward.\nSentence B: The camera view is moving left.", "gt-answer": "Sentence A: The camera view is moving backward.", "video-llm-prediction": "Sentence A: The camera view is moving backward.", "match_success": true, "rating": 1 } ] }, "1089201973_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The football is moving from right to left.\nOption 2: The football is moving from left to right in the video.", "gt-answer": "Option 1: The football is moving from right to left.", "video-llm-prediction": "Option 2: The football is moving from left to right in the video.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The football is moving from left to right in the video.\nSentence B: The football is moving from right to left in the video.", "gt-answer": "Sentence B: The football is moving from right to left in the video.", "video-llm-prediction": "Sentence A: The football is moving from left to right in the video.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The football is moving upwards.\nCaption B: The football is moving from right to left in the video.", "gt-answer": "Caption B: The football is moving from right to left in the video.", "video-llm-prediction": "Caption A: The football is moving upwards.", "match_success": true, "rating": 0 } ] }, "1034736653_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman athletes are running from right to left.\nOption 2: The woman athletes are running from left to right.", "gt-answer": "Option 1: The woman athletes are running from right to left.", "video-llm-prediction": "Option 2: The woman athletes are running from left to right.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman athletes are running from left to right.\nSentence B: The woman athletes are running from right to left.", "gt-answer": "Sentence B: The woman athletes are running from right to left.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The woman athletes are running from top to bottom.\nCaption B: The woman athletes are running from right to left.", "gt-answer": "Caption B: The woman athletes are running from right to left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1084153195_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The dolphins are hovering in one place.\nCaption B: The dolphins are swimming away from the shore.", "gt-answer": "Caption B: The dolphins are swimming away from the shore.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dolphins are swimming away from the shore.\nSentence B: The dolphins are swimming towards the shore.", "gt-answer": "Sentence A: The dolphins are swimming away from the shore.", "video-llm-prediction": "Sentence A: The dolphins are swimming away from the shore.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The dolphins are swimming away from the shore.\nOption 2: The dolphins are swimming parallel to the shore.", "gt-answer": "Option 1: The dolphins are swimming away from the shore.", "video-llm-prediction": "Option 2: The dolphins are swimming parallel to the shore.", "match_success": true, "rating": 0 } ] }, "1081092839_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The sun is descending.\nCaption B: The sun is ascending.", "gt-answer": "Caption B: The sun is ascending.", "video-llm-prediction": "Caption B: The sun is ascending.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun is moving upwards.\nSentence B: The sun is moving downwards.", "gt-answer": "Sentence A: The sun is moving upwards.", "video-llm-prediction": "Sentence B: The sun is moving downwards.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun is descending.\nOption 2: The sun is rising.", "gt-answer": "Option 2: The sun is rising.", "video-llm-prediction": "Option 2: The sun is rising.", "match_success": true, "rating": 1 } ] }, "1059462749_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is moving upwards.\nSentence B: The person is moving rightwards.", "gt-answer": "Sentence A: The person is moving upwards.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is moving downwards.\nOption 2: The person is moving upwards.", "gt-answer": "Option 2: The person is moving upwards.", "video-llm-prediction": "Option 2: The person is moving upwards.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The person is moving upwards.\nCaption B: The person is moving leftwards.", "gt-answer": "Caption A: The person is moving upwards.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1088279109_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The elevator is rising.\nSentence B: The elevator is going down.", "gt-answer": "Sentence B: The elevator is going down.", "video-llm-prediction": "Sentence A: The elevator is rising.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The elevator is staying still.\nCaption B: The elevator is going down.", "gt-answer": "Caption B: The elevator is going down.", "video-llm-prediction": "Caption B: The elevator is going down.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The elevator is going down.\nOption 2: The elevator is not moving.", "gt-answer": "Option 1: The elevator is going down.", "video-llm-prediction": "Option 2: The elevator is not moving.", "match_success": true, "rating": 0 } ] }, "1096612823_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is zooming in.\nOption 2: The video is zooming out.", "gt-answer": "Option 2: The video is zooming out.", "video-llm-prediction": "Option 2: The video is zooming out.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is zooming out.\nCaption B: The video is rotating.", "gt-answer": "Caption A: The video is zooming out.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is zooming out.\nSentence B: The video is panning left.", "gt-answer": "Sentence A: The video is zooming out.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 } ] }, "1075484900_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The child is turning away from the man.\nSentence B: The child is turning towards the man.", "gt-answer": "Sentence B: The child is turning towards the man.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The child is turning towards the man.\nOption 2: The child is turning away from the man.", "gt-answer": "Option 1: The child is turning towards the man.", "video-llm-prediction": "Option 2: The child is turning away from the man.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The child is moving forward in relation to the man.\nCaption B: The child is turning away from the man.", "gt-answer": "Caption A: The child is moving forward in relation to the man.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1090578917_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The man is leaping to his left.\nCaption B: The man is leaping to his right.", "gt-answer": "Caption A: The man is leaping to his left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is leaping to his left.\nSentence B: The man is leaping backward.", "gt-answer": "Sentence A: The man is leaping to his left.", "video-llm-prediction": "Sentence A: The man is leaping to his left.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is leaping to his left.\nOption 2: The man is leaping forward.", "gt-answer": "Option 1: The man is leaping to his left.", "video-llm-prediction": "Option 2: The man is leaping forward.", "match_success": true, "rating": 0 } ] }, "1075338140_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ball is rolling from right to left.\nSentence B: The ball is rolling from left to right.", "gt-answer": "Sentence A: The ball is rolling from right to left.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The ball is rolling from left to right.\nCaption B: The ball is rolling from right to left.", "gt-answer": "Caption B: The ball is rolling from right to left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ball is rolling from right to left.\nOption 2: The ball is rolling from left to right.", "gt-answer": "Option 1: The ball is rolling from right to left.", "video-llm-prediction": "Option 1: The ball is rolling from right to left.", "match_success": true, "rating": 1 } ] }, "1067268403_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The wind turbines are stationary.\nCaption B: The wind turbines are rotating counterclockwise.", "gt-answer": "Caption B: The wind turbines are rotating counterclockwise.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The wind turbines are rotating counterclockwise.\nSentence B: The wind turbines are rotating clockwise.", "gt-answer": "Sentence A: The wind turbines are rotating counterclockwise.", "video-llm-prediction": "Sentence A: The wind turbines are rotating counterclockwise.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The wind turbines are rotating counterclockwise.\nOption 2: The wind turbines are rotating clockwise.", "gt-answer": "Option 1: The wind turbines are rotating counterclockwise.", "video-llm-prediction": "Option 1: The wind turbines are rotating counterclockwise.", "match_success": true, "rating": 1 } ] }, "1096007487_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3d cloud is moving upward from the camera's point of view.\nSentence B: The 3d cloud is moving rightward from the camera's point of view.", "gt-answer": "Sentence B: The 3d cloud is moving rightward from the camera's point of view.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The 3d cloud is moving downward from the camera's point of view.\nCaption B: The 3d cloud is moving rightward from the camera's point of view.", "gt-answer": "Caption B: The 3d cloud is moving rightward from the camera's point of view.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3d cloud is moving rightward from the camera's point of view.\nOption 2: The 3d cloud is moving leftward from the camera's point of view.", "gt-answer": "Option 1: The 3d cloud is moving rightward from the camera's point of view.", "video-llm-prediction": "Option 1: The 3d cloud is moving rightward from the camera's point of view.", "match_success": true, "rating": 1 } ] }, "1095939659_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The light is growing counterclockwise.\nCaption B: The light is growing downwards.", "gt-answer": "Caption A: The light is growing counterclockwise.", "video-llm-prediction": "Caption A: The light is growing counterclockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The light is growing counterclockwise.\nSentence B: The light is growing clockwise.", "gt-answer": "Sentence A: The light is growing counterclockwise.", "video-llm-prediction": "Sentence A: The light is growing counterclockwise.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The light is growing counterclockwise.\nOption 2: The light is moving straight forward.", "gt-answer": "Option 1: The light is growing counterclockwise.", "video-llm-prediction": "Option 1: The light is growing counterclockwise.", "match_success": true, "rating": 1 } ] }, "1098785169_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The galaxy is spinning counterclockwise.\nCaption B: The galaxy is rotating clockwise.", "gt-answer": "Caption A: The galaxy is spinning counterclockwise.", "video-llm-prediction": "Caption A: The galaxy is spinning counterclockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The galaxy's spin is counterclockwise.\nSentence B: The galaxy is rotating clockwise.", "gt-answer": "Sentence A: The galaxy's spin is counterclockwise.", "video-llm-prediction": "Sentence A: The galaxy's spin is counterclockwise.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The rotation of the galaxy is counterclockwise.\nOption 2: The galaxy is rotating clockwise.", "gt-answer": "Option 1: The rotation of the galaxy is counterclockwise.", "video-llm-prediction": "Option 1: The galaxy is rotating counterclockwise.", "match_success": false, "chatgpt-response": "Incorrect", "rating": 0 } ] }, "1099984801_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The clouds are moving away from the camera.\nSentence B: The clouds are moving towards the camera.", "gt-answer": "Sentence A: The clouds are moving away from the camera.", "video-llm-prediction": "Sentence B: The clouds are moving towards the camera.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The clouds are moving away from the camera.\nOption 2: The clouds are staying still.", "gt-answer": "Option 1: The clouds are moving away from the camera.", "video-llm-prediction": "Option 1: The clouds are moving away from the camera.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The clouds are moving away from the camera.\nCaption B: The clouds are moving towards the camera.", "gt-answer": "Caption A: The clouds are moving away from the camera.", "video-llm-prediction": "Caption B: The clouds are moving towards the camera.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The brightness of the video is staying the same.\nOption 2: The entire video is getting brighter.", "gt-answer": "Option 2: The entire video is getting brighter.", "video-llm-prediction": "Option 2: The entire video is getting brighter.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The entire video is getting darker.\nCaption B: The video is getting brighter.", "gt-answer": "Caption B: The video is getting brighter.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The entire video is getting darker.\nSentence B: The entire video is getting brighter.", "gt-answer": "Sentence B: The entire video is getting brighter.", "video-llm-prediction": "Sentence B: The entire video is getting brighter.", "match_success": true, "rating": 1 } ] }, "1082419672_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The movement in the video is flying upwards relative to the ship.\nOption 2: The movement in the video is flying forwards relative to the ship.", "gt-answer": "Option 2: The movement in the video is flying forwards relative to the ship.", "video-llm-prediction": "Option 1: The movement in the video is flying upwards relative to the ship.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The movement in the video is flying backwards relative to the ship.\nSentence B: The movement in the video is flying forwards relative to the ship.", "gt-answer": "Sentence B: The movement in the video is flying forwards relative to the ship.", "video-llm-prediction": "Sentence A: The movement in the video is flying backwards relative to the ship.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The movement in the video is flying backwards relative to the ship.\nCaption B: The movement in the video is flying forwards relative to the ship.", "gt-answer": "Caption B: The movement in the video is flying forwards relative to the ship.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1058985719_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The airplane is moving from right to left.\nCaption B: The airplane is flying from top to bottom.", "gt-answer": "Caption B: The airplane is flying from top to bottom.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The airplane is flying from bottom to top.\nOption 2: The airplane is flying from top to bottom.", "gt-answer": "Option 2: The airplane is flying from top to bottom.", "video-llm-prediction": "Option 2: The airplane is flying from top to bottom.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The airplane is flying from top to bottom.\nSentence B: The airplane is moving from left to right.", "gt-answer": "Sentence A: The airplane is flying from top to bottom.", "video-llm-prediction": "Sentence A: The airplane is flying from top to bottom.", "match_success": true, "rating": 1 } ] }, "1055413730_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The planet Earth is spinning to the left.\nOption 2: The planet Earth is spinning to the right.", "gt-answer": "Option 1: The planet Earth is spinning to the left.", "video-llm-prediction": "Option 2: The planet Earth is spinning to the right.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The planet Earth is spinning to the left.\nCaption B: The Earth is rotating upward.", "gt-answer": "Caption A: The planet Earth is spinning to the left.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The planet Earth is spinning to the left.\nSentence B: The planet Earth is spinning to the right.", "gt-answer": "Sentence A: The planet Earth is spinning to the left.", "video-llm-prediction": "Sentence A: The planet Earth is spinning to the left.", "match_success": true, "rating": 1 } ] }, "1081684532_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The asteroids in the video are flying towards the camera.\nSentence B: The asteroids are flying away from the camera.", "gt-answer": "Sentence B: The asteroids are flying away from the camera.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The asteroids in the video are flying away from the camera.\nOption 2: The asteroids are flying to the left.", "gt-answer": "Option 1: The asteroids in the video are flying away from the camera.", "video-llm-prediction": "Option 1: The asteroids in the video are flying away from the camera.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The asteroids are flying to the right.\nCaption B: The asteroids in the video are flying away from the camera.", "gt-answer": "Caption B: The asteroids in the video are flying away from the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "23391142_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is panning upwards.\nOption 2: The video is panning to the left.", "gt-answer": "Option 2: The video is panning to the left.", "video-llm-prediction": "Option 2: The video is panning to the left.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is zooming in.\nCaption B: The video is panning to the left.", "gt-answer": "Caption B: The video is panning to the left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is panning to the right.\nSentence B: The video is panning to the left.", "gt-answer": "Sentence B: The video is panning to the left.", "video-llm-prediction": "Sentence A: The video is panning to the right.", "match_success": true, "rating": 0 } ] }, "1053758117_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The camera is standing still before a 3D digital brain.\nCaption B: The camera is zooming out from a 3D digital brain.", "gt-answer": "Caption B: The camera is zooming out from a 3D digital brain.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is zooming out from a 3D digital brain.\nOption 2: The camera is zooming into a 3D digital brain.", "gt-answer": "Option 1: The camera is zooming out from a 3D digital brain.", "video-llm-prediction": "Option 2: The camera is zooming into a 3D digital brain.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming out from a 3D digital brain.\nSentence B: The camera is moving downwards.", "gt-answer": "Sentence A: The camera is zooming out from a 3D digital brain.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1106668103_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is staying still.\nOption 2: The movement in the video is backward.", "gt-answer": "Option 2: The movement in the video is backward.", "video-llm-prediction": "Option 2: The movement in the video is backward.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The movement in the video is forward.\nCaption B: The movement in the video is backward.", "gt-answer": "Caption B: The movement in the video is backward.", "video-llm-prediction": "Caption A: The movement in the video is forward.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The movement in the video is backward.\nSentence B: The primary motion depicted in the video is turning in circles.", "gt-answer": "Sentence A: The movement in the video is backward.", "video-llm-prediction": "Sentence A: The movement in the video is backward.", "match_success": true, "rating": 1 } ] }, "1057163434_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The chef is removing the bread from the top of the burger.\nCaption B: The chef is putting the bread on top of the burger.", "gt-answer": "Caption A: The chef is removing the bread from the top of the burger.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The chef is putting the bread on top of the burger.\nOption 2: The chef is removing the bread from the top of the burger.", "gt-answer": "Option 2: The chef is removing the bread from the top of the burger.", "video-llm-prediction": "Option 2: The chef is removing the bread from the top of the burger.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The chef is putting the bread on top of the burger.\nSentence B: The chef is removing the bread from the top of the burger.", "gt-answer": "Sentence B: The chef is removing the bread from the top of the burger.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1100319395_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The circular pattern is moving counter-clockwise.\nCaption B: The circular pattern is moving clockwise.", "gt-answer": "Caption A: The circular pattern is moving counter-clockwise.", "video-llm-prediction": "Caption B: The circular pattern is moving clockwise.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The circular pattern is moving clockwise.\nOption 2: The circular pattern is spinning counter-clockwise.", "gt-answer": "Option 2: The circular pattern is spinning counter-clockwise.", "video-llm-prediction": "Option 1: The circular pattern is moving clockwise.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The circular pattern is vibrating back and forth.\nSentence B: The circular pattern is moving counter-clockwise.", "gt-answer": "Sentence B: The circular pattern is moving counter-clockwise.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1101200293_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is moving counterclockwise around the aircraft carrier.\nSentence B: The camera is moving clockwise around the aircraft carrier.", "gt-answer": "Sentence A: The camera is moving counterclockwise around the aircraft carrier.", "video-llm-prediction": "Sentence A: The camera is moving counterclockwise around the aircraft carrier.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The camera is moving counterclockwise around the aircraft carrier.\nCaption B: The camera is tilting upwardsaround the aircraft carrier.", "gt-answer": "Caption A: The camera is moving counterclockwise around the aircraft carrier.", "video-llm-prediction": "Caption A: The camera is moving counterclockwise around the aircraft carrier.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is moving counterclockwise around the aircraft carrier.\nOption 2: The camera is moving back and forth around the aircraft carrier.", "gt-answer": "Option 1: The camera is moving counterclockwise around the aircraft carrier.", "video-llm-prediction": "Option 1: The camera is moving counterclockwise around the aircraft carrier.", "match_success": true, "rating": 1 } ] }, "1072453637_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is panning to the front of a fighter jet.\nSentence B: The camera is panning downwards around a fighter jet.", "gt-answer": "Sentence A: The camera is panning to the front of a fighter jet.", "video-llm-prediction": "Sentence A: The camera is panning to the front of a fighter jet.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning to the front of a fighter jet.\nOption 2: The camera is panning upwards around a fighter jet.", "gt-answer": "Option 1: The camera is panning to the front of a fighter jet.", "video-llm-prediction": "Option 2: The camera is panning upwards around a fighter jet.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera is panning to the back of a fighter jet.\nCaption B: The camera is panning to the front of a fighter jet.", "gt-answer": "Caption B: The camera is panning to the front of a fighter jet.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "3396473605_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The five stars appear from left to right.\nSentence B: The five stars disappear from right to left.", "gt-answer": "Sentence B: The five stars disappear from right to left.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The five stars disappear from right to left.\nOption 2: The five stars appear from top to bottom.", "gt-answer": "Option 1: The five stars disappear from right to left.", "video-llm-prediction": "Option 2: The five stars appear from top to bottom.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The five stars disappear from right to left.\nCaption B: The five stars appear from bottom to top.", "gt-answer": "Caption A: The five stars disappear from right to left.", "video-llm-prediction": "Caption B: The five stars appear from bottom to top.", "match_success": true, "rating": 0 } ] }, "1086820415_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The large wave is moving horizontally towards the right side of the screen.\nSentence B: The large wave is moving vertically towards the top of the screen.", "gt-answer": "Sentence B: The large wave is moving vertically towards the top of the screen.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The large wave is moving vertically towards the top of the screen.\nOption 2: The large wave is moving vertically towards the bottom of the screen.", "gt-answer": "Option 1: The large wave is moving vertically towards the top of the screen.", "video-llm-prediction": "Option 1: The large wave is moving vertically towards the top of the screen.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The large wave is moving vertically towards the top of the screen.\nCaption B: The large wave is moving diagonally towards the top-left corner.", "gt-answer": "Caption A: The large wave is moving vertically towards the top of the screen.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1073831006_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The zebras are moving from right to left.\nCaption B: The zebras are moving from left to right.", "gt-answer": "Caption A: The zebras are moving from right to left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The zebras are moving from right to left.\nOption 2: The zebras are moving from top to bottom.", "gt-answer": "Option 1: The zebras are moving from right to left.", "video-llm-prediction": "Option 1: The zebras are moving from right to left.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The zebras are moving away from the camera.\nSentence B: The zebras are moving from right to left.", "gt-answer": "Sentence B: The zebras are moving from right to left.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1024867412_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The car is taking a right turn.\nCaption B: The car is taking a left turn.", "gt-answer": "Caption B: The car is taking a left turn.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The car is going backward.\nSentence B: The car is taking a left turn.", "gt-answer": "Sentence B: The car is taking a left turn.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The car is taking a left turn.\nOption 2: The car is moving forward.", "gt-answer": "Option 1: The car is taking a left turn.", "video-llm-prediction": "Option 2: The car is moving forward.", "match_success": true, "rating": 0 } ] }, "1076877854_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The robotic arm is moving to the left side of the screen.\nSentence B: The closest robotic arm is moving to the right side of the screen.", "gt-answer": "Sentence A: The robotic arm is moving to the left side of the screen.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The closest robotic arm is moving to the left side of the screen.\nCaption B: The robotic arm is moving away from the camera.", "gt-answer": "Caption A: The closest robotic arm is moving to the left side of the screen.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The robotic arm is rotating.\nOption 2: The closest robotic arm is moving to the left side of the screen.", "gt-answer": "Option 2: The closest robotic arm is moving to the left side of the screen.", "video-llm-prediction": "Option 2: The closest robotic arm is moving to the left side of the screen.", "match_success": true, "rating": 1 } ] }, "1100468035_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The camera is zooming backward in the video.\nCaption B: The camera is zooming forward in the video.", "gt-answer": "Caption A: The camera is zooming backward in the video.", "video-llm-prediction": "Caption B: The camera is zooming forward in the video.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming backward in the video.\nSentence B: The camera is tracking right.", "gt-answer": "Sentence A: The camera is zooming backward in the video.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning left.\nOption 2: The camera is zooming backward in the video.", "gt-answer": "Option 2: The camera is zooming backward in the video.", "video-llm-prediction": "Option 1: The camera is panning left.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The door is gradually closing.\nCaption B: The door is gradually opening.", "gt-answer": "Caption A: The door is gradually closing.", "video-llm-prediction": "Caption B: The door is gradually opening.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The door is gradually closing.\nSentence B: The door is remaining closed.", "gt-answer": "Sentence A: The door is gradually closing.", "video-llm-prediction": "Sentence A: The door is gradually closing.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The door is gradually opening.\nOption 2: The door is gradually closing.", "gt-answer": "Option 2: The door is gradually closing.", "video-llm-prediction": "Option 2: The door is gradually closing.", "match_success": true, "rating": 1 } ] }, "3411806181_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The person is unplugging the charging gun from the car.\nOption 2: The person is plugging the charging gun into the car.", "gt-answer": "Option 1: The person is unplugging the charging gun from the car.", "video-llm-prediction": "Option 2: The person is plugging the charging gun into the car.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is moving the charging gun away from the car.\nSentence B: The person is plugging the charging gun into the car.", "gt-answer": "Sentence A: The person is moving the charging gun away from the car.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person is holding the charging gun still.\nCaption B: The person is unplugging the charging gun from the car.", "gt-answer": "Caption B: The person is unplugging the charging gun from the car.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1073914229_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The trains are moving towards each other.\nSentence B: The trains are moving away from each other.", "gt-answer": "Sentence B: The trains are moving away from each other.", "video-llm-prediction": "Sentence A: The trains are moving towards each other.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The trains are moving away from each other.\nOption 2: The trains are moving towards each other.", "gt-answer": "Option 1: The trains are moving away from each other.", "video-llm-prediction": "Option 2: The trains are moving towards each other.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The trains are moving towards each other.\nCaption B: The trains are moving away from each other.", "gt-answer": "Caption B: The trains are moving away from each other.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1093139559_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming out from three football players.\nSentence B: The camera is zooming into three football players.", "gt-answer": "Sentence A: The camera is zooming out from three football players.", "video-llm-prediction": "Sentence B: The camera is zooming into three football players.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera is zooming out from three football players.\nCaption B: The camera is panning left.", "gt-answer": "Caption A: The camera is zooming out from three football players.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is zooming out from three football players.\nOption 2: The camera is panning right.", "gt-answer": "Option 1: The camera is zooming out from three football players.", "video-llm-prediction": "Option 1: The camera is zooming out from three football players.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The light on the football players is turning brighter.\nOption 2: The light on the football players is turning darker.", "gt-answer": "Option 2: The light on the football players is turning darker.", "video-llm-prediction": "Option 2: The light on the football players is turning darker.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The light on the football players is staying the same.\nCaption B: The light on the football players is turning darker.", "gt-answer": "Caption B: The light on the football players is turning darker.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The light on the football players is dimming.\nSentence B: The light on the football players is turning brighter.", "gt-answer": "Sentence A: The light on the football players is dimming.", "video-llm-prediction": "Sentence B: The light on the football players is turning brighter.", "match_success": true, "rating": 0 } ] }, "1080591311_reverse": { "direction": [ { "question": "Which caption matches the video better?\nCaption A: The jellyfish is floating downwards.\nCaption B: The jellyfish is floating upwards.", "gt-answer": "Caption A: The jellyfish is floating downwards.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The jellyfish is moving towards the right.\nSentence B: The jellyfish is floating downwards.", "gt-answer": "Sentence B: The jellyfish is floating downwards.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The jellyfish is sinking downwards.\nOption 2: The jellyfish is floating upwards.", "gt-answer": "Option 1: The jellyfish is sinking downwards.", "video-llm-prediction": "Option 1: The jellyfish is sinking downwards.", "match_success": true, "rating": 1 } ] }, "3411228673_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is moving upwards along the skyscraper buildings.\nSentence B: The camera is moving downwards along the skyscraper buildings.", "gt-answer": "Sentence B: The camera is moving downwards along the skyscraper buildings.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The movement in the video is downwards among skyscraper buildings.\nOption 2: The camera is moving backwards.", "gt-answer": "Option 1: The movement in the video is downwards among skyscraper buildings.", "video-llm-prediction": "Option 1: The movement in the video is downwards among skyscraper buildings.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The movement in the video is upwards among skyscraper buildings.\nCaption B: The camera is moving downwards.", "gt-answer": "Caption B: The camera is moving downwards.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1093737353_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is panning to the left.\nSentence B: The camera is panning to the right.", "gt-answer": "Sentence A: The camera is panning to the left.", "video-llm-prediction": "Sentence B: The camera is panning to the right.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The camera is panning to the left.\nCaption B: The camera is tilting up.", "gt-answer": "Caption A: The camera is panning to the left.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning to the left.\nOption 2: The camera is zooming in.", "gt-answer": "Option 1: The camera is panning to the left.", "video-llm-prediction": "Option 2: The camera is zooming in.", "match_success": true, "rating": 0 } ] }, "1017768724_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The person is moving leftwards.\nOption 2: The person is moving rightwards.", "gt-answer": "Option 1: The person is moving leftwards.", "video-llm-prediction": "Option 2: The person is moving rightwards.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person is moving leftwards.\nSentence B: The person is moving upwards.", "gt-answer": "Sentence A: The person is moving leftwards.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The person is moving downwards.\nCaption B: The person is moving leftwards.", "gt-answer": "Caption B: The person is moving leftwards.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1100117263_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The little lion is jumping onto the back of an adult lion.\nSentence B: The little lion is falling from the back of an adult lion.", "gt-answer": "Sentence A: The little lion is jumping onto the back of an adult lion.", "video-llm-prediction": "Sentence A: The little lion is jumping onto the back of an adult lion.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The little lion is sitting nearby an adult lion.\nCaption B: The little lion is jumping onto the back of an adult lion.", "gt-answer": "Caption B: The little lion is jumping onto the back of an adult lion.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The little lion is jumping onto the back of an adult lion.\nOption 2: The little lion is sitting on the back of an adult lion.", "gt-answer": "Option 1: The little lion is jumping onto the back of an adult lion.", "video-llm-prediction": "Option 2: The little lion is sitting on the back of an adult lion.", "match_success": true, "rating": 0 } ] }, "1021488277_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is dropping down the pineapple.\nSentence B: A person is picking up the pineapple.", "gt-answer": "Sentence A: A person is dropping down the pineapple.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pineapple is being rotated by a person.\nOption 2: A person is dropping down the pineapple.", "gt-answer": "Option 2: A person is dropping down the pineapple.", "video-llm-prediction": "Option 1: The pineapple is being rotated by a person.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: A person is dropping down the pineapple.\nCaption B: The pineapple is being pushed forward by a person.", "gt-answer": "Caption A: A person is dropping down the pineapple.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1100397435_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The robot vacuum cleaner is moving to the right side of the screen.\nOption 2: The robot vacuum cleaner is moving to the left side of the screen.", "gt-answer": "Option 2: The robot vacuum cleaner is moving to the left side of the screen.", "video-llm-prediction": "Option 1: The robot vacuum cleaner is moving to the right side of the screen.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The robot vacuum cleaner is moving to the left side of the screen.\nCaption B: The robot vacuum cleaner is moving towards the screen.", "gt-answer": "Caption A: The robot vacuum cleaner is moving to the left side of the screen.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The robot vacuum cleaner is moving away from the screen.\nSentence B: The robot vacuum cleaner is moving to the left side of the screen.", "gt-answer": "Sentence B: The robot vacuum cleaner is moving to the left side of the screen.", "video-llm-prediction": "Sentence A: The robot vacuum cleaner is moving away from the screen.", "match_success": true, "rating": 0 } ] }, "1108534143_reverse": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The puppy is walking into a wigwam.\nOption 2: The puppy is walking out of a wigwam.", "gt-answer": "Option 1: The puppy is walking into a wigwam.", "video-llm-prediction": "Option 1: The puppy is walking into a wigwam.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The puppy is staying in a wigwam.\nCaption B: The puppy is walking into a wigwam.", "gt-answer": "Caption B: The puppy is walking into a wigwam.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The puppy is walking into a wigwam.\nSentence B: The puppy is walking around a wigwam.", "gt-answer": "Sentence A: The puppy is walking into a wigwam.", "video-llm-prediction": "Sentence A: The puppy is walking into a wigwam.", "match_success": true, "rating": 1 } ] }, "1047368344_reverse": { "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl is jumping into the water.\nSentence B: The girl is jumping out of water.", "gt-answer": "Sentence B: The girl is jumping out of water.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The girl is jumping around water.\nCaption B: The girl is jumping out of the water.", "gt-answer": "Caption B: The girl is jumping out of the water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The girl is swimming in the water.\nOption 2: The girl is jumping out of the water.", "gt-answer": "Option 2: The girl is jumping out of the water.", "video-llm-prediction": "Option 2: The girl is jumping out of the water.", "match_success": true, "rating": 1 } ] }, "1050618460_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The flowers are withering.\nSentence B: The flowers are turning into full bloom.", "gt-answer": "Sentence A: The flowers are withering.", "video-llm-prediction": "Sentence B: The flowers are turning into full bloom.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The flowers are turning into full bloom.\nCaption B: The flowers are shrinking and wilting.", "gt-answer": "Caption B: The flowers are shrinking and wilting.", "video-llm-prediction": "Caption A: The flowers are turning into full bloom.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The flowers are withering.\nOption 2: The flowers are turning into buds.", "gt-answer": "Option 1: The flowers are withering.", "video-llm-prediction": "Option 2: The flowers are turning into buds.", "match_success": true, "rating": 0 } ] }, "1083113449_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The sky is maintaining its brightness.\nCaption B: The sky is getting brighter.", "gt-answer": "Caption B: The sky is getting brighter.", "video-llm-prediction": "Caption B: The sky is getting brighter.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sky is lightening up.\nOption 2: The sky is getting darker.", "gt-answer": "Option 1: The sky is lightening up.", "video-llm-prediction": "Option 2: The sky is getting darker.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sky is getting darker.\nSentence B: The sky is brightening.", "gt-answer": "Sentence B: The sky is brightening.", "video-llm-prediction": "Sentence B: The sky is brightening.", "match_success": true, "rating": 1 } ] }, "1091143117_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The eye is changing from open to closed.\nOption 2: The eye is blinking rapidly.", "gt-answer": "Option 1: The eye is changing from open to closed.", "video-llm-prediction": "Option 1: The eye is changing from open to closed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The eye is changing from closed to open.\nCaption B: The eye is changing from open to closed.", "gt-answer": "Caption B: The eye is changing from open to closed.", "video-llm-prediction": "Caption B: The eye is changing from open to closed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The eye is changing from closed to open.\nSentence B: The eye is changing from open to closed.", "gt-answer": "Sentence B: The eye is changing from open to closed.", "video-llm-prediction": "Sentence A: The eye is changing from closed to open.", "match_success": true, "rating": 0 } ] }, "1098153561_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The leaves are changing color from green to yellow.\nCaption B: The leaves are changing color from yellow to green.", "gt-answer": "Caption B: The leaves are changing color from yellow to green.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The leaves are changing color from yellow to green.\nSentence B: The leaves are changing color from green to yellow.", "gt-answer": "Sentence A: The leaves are changing color from yellow to green.", "video-llm-prediction": "Sentence A: The leaves are changing color from yellow to green.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The leaves are changing color from yellow to green.\nOption 2: The leaves are changing color from green to yellow.", "gt-answer": "Option 1: The leaves are changing color from yellow to green.", "video-llm-prediction": "Option 1: The leaves are changing color from yellow to green.", "match_success": true, "rating": 1 } ] }, "1059072773_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The ice cream is melting.\nCaption B: The ice cream is freezing.", "gt-answer": "Caption B: The ice cream is freezing.", "video-llm-prediction": "Caption A: The ice cream is melting.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ice cream is evaporating.\nOption 2: The ice cream is freezing.", "gt-answer": "Option 2: The ice cream is freezing.", "video-llm-prediction": "Option 1: The ice cream is evaporating.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream is melting.\nSentence B: The ice cream is solidifying.", "gt-answer": "Sentence B: The ice cream is solidifying.", "video-llm-prediction": "Sentence A: The ice cream is melting.", "match_success": true, "rating": 0 } ] }, "1093573255_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The plant is reviving.\nOption 2: The plant is wilting.", "gt-answer": "Option 2: The plant is wilting.", "video-llm-prediction": "Option 1: The plant is reviving.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The plant is decaying.\nSentence B: The plant is reviving.", "gt-answer": "Sentence A: The plant is decaying.", "video-llm-prediction": "Sentence B: The plant is reviving.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The plant is reviving.\nCaption B: The plant is wilting.", "gt-answer": "Caption B: The plant is wilting.", "video-llm-prediction": "Caption A: The plant is reviving.", "match_success": true, "rating": 0 } ] }, "1077146132_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is turning darker.\nOption 2: The video is turning brighter.", "gt-answer": "Option 1: The video is turning darker.", "video-llm-prediction": "Option 2: The video is turning brighter.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is staying the same brightness.\nSentence B: The video is turning darker.", "gt-answer": "Sentence B: The video is turning darker.", "video-llm-prediction": "Sentence B: The video is turning darker.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is decreasing in brightness.\nCaption B: The video is turning brighter.", "gt-answer": "Caption A: The video is decreasing in brightness.", "video-llm-prediction": "Caption A: The video is decreasing in brightness.", "match_success": true, "rating": 1 } ] }, "1086688682_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The traffic lights are changing from red to yellow.\nSentence B: The traffic lights are changing from green to red.", "gt-answer": "Sentence B: The traffic lights are changing from green to red.", "video-llm-prediction": "Sentence A: The traffic lights are changing from red to yellow.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The traffic lights are changing from yellow to red.\nCaption B: The traffic lights are changing from green to red.", "gt-answer": "Caption B: The traffic lights are changing from green to red.", "video-llm-prediction": "Caption B: The traffic lights are changing from green to red.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The traffic lights are changing from green to red.\nOption 2: The traffic lights are changing from red to green.", "gt-answer": "Option 1: The traffic lights are changing from green to red.", "video-llm-prediction": "Option 1: The traffic lights are changing from green to red.", "match_success": true, "rating": 1 } ] }, "1099738787_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The concrete wall is falling apart.\nCaption B: The concrete wall is assembling together.", "gt-answer": "Caption B: The concrete wall is assembling together.", "video-llm-prediction": "Caption B: The concrete wall is assembling together.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The concrete wall is falling apart.\nOption 2: The concrete wall is growing taller.", "gt-answer": "Option 2: The concrete wall is growing taller.", "video-llm-prediction": "Option 1: The concrete wall is falling apart.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The concrete wall is assembling together.\nSentence B: The concrete wall is falling apart.", "gt-answer": "Sentence A: The concrete wall is assembling together.", "video-llm-prediction": "Sentence B: The concrete wall is falling apart.", "match_success": true, "rating": 0 } ] }, "1094219575_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The flowers are blooming.\nCaption B: The flowers are wilting.", "gt-answer": "Caption A: The flowers are blooming.", "video-llm-prediction": "Caption B: The flowers are wilting.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The flowers are blooming.\nOption 2: The flowers are wilting.", "gt-answer": "Option 1: The flowers are blooming.", "video-llm-prediction": "Option 1: The flowers are blooming.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The flowers are wilting.\nSentence B: The flowers are blooming.", "gt-answer": "Sentence B: The flowers are blooming.", "video-llm-prediction": "Sentence B: The flowers are blooming.", "match_success": true, "rating": 1 } ] }, "1067427023_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The snow particles are melting.\nSentence B: The snow particles are solidifying.", "gt-answer": "Sentence B: The snow particles are solidifying.", "video-llm-prediction": "Sentence A: The snow particles are melting.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The snow particles are freezing.\nOption 2: The snow particles are melting.", "gt-answer": "Option 1: The snow particles are freezing.", "video-llm-prediction": "Option 2: The snow particles are melting.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The snow particles are freezing.\nCaption B: The snow particles are remaining the same.", "gt-answer": "Caption A: The snow particles are freezing.", "video-llm-prediction": "Caption A: The snow particles are freezing.", "match_success": true, "rating": 1 } ] }, "1093948229_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The golden particles are exploding.\nSentence B: The golden particles are disappearing.", "gt-answer": "Sentence B: The golden particles are disappearing.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The golden particles are exploding.\nOption 2: The golden particles are shrinking.", "gt-answer": "Option 2: The golden particles are shrinking.", "video-llm-prediction": "Option 1: The golden particles are exploding.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The golden particles are contracting.\nCaption B: The golden particles are exploding.", "gt-answer": "Caption A: The golden particles are contracting.", "video-llm-prediction": "Caption B: The golden particles are exploding.", "match_success": true, "rating": 0 } ] }, "1049965795_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The light bulb is turning off.\nSentence B: The light bulb is lighting up.", "gt-answer": "Sentence A: The light bulb is turning off.", "video-llm-prediction": "Sentence A: The light bulb is turning off.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The light bulb is breaking.\nCaption B: The light bulb is turning off.", "gt-answer": "Caption B: The light bulb is turning off.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The light bulb is rapidly changing color.\nOption 2: The light bulb is turning off.", "gt-answer": "Option 2: The light bulb is turning off.", "video-llm-prediction": "Option 1: The light bulb is rapidly changing color.", "match_success": true, "rating": 0 } ] }, "1052364490_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The digital bar chart is decreasing.\nSentence B: The digital bar chart is staying in the same size.", "gt-answer": "Sentence A: The digital bar chart is decreasing.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The digital bar chart is growing.\nCaption B: The digital bar chart is shrinking.", "gt-answer": "Caption B: The digital bar chart is shrinking.", "video-llm-prediction": "Caption B: The digital bar chart is shrinking.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The digital bar chart is decreasing.\nOption 2: The digital bar chart is growing.", "gt-answer": "Option 1: The digital bar chart is decreasing.", "video-llm-prediction": "Option 1: The digital bar chart is decreasing.", "match_success": true, "rating": 1 } ] }, "1080990179_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The apple is shrinking and drying out.\nCaption B: The apple is ripening.", "gt-answer": "Caption B: The apple is ripening.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The apple is shrinking and drying out.\nSentence B: The apple is growing bigger.", "gt-answer": "Sentence B: The apple is growing bigger.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The apple is becoming juicier.\nOption 2: The apple is shrinking and drying out.", "gt-answer": "Option 1: The apple is becoming juicier.", "video-llm-prediction": "Option 2: The apple is shrinking and drying out.", "match_success": true, "rating": 0 } ] }, "1077575504_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The pile of salt is shrinking.\nOption 2: The pile of salt is growing.", "gt-answer": "Option 1: The pile of salt is shrinking.", "video-llm-prediction": "Option 1: The pile of salt is shrinking.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The pile of salt is melting.\nSentence B: The pile of salt is shrinking.", "gt-answer": "Sentence B: The pile of salt is shrinking.", "video-llm-prediction": "Sentence B: The pile of salt is shrinking.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The pile of salt is growing.\nCaption B: The pile of salt is disappearing.", "gt-answer": "Caption B: The pile of salt is disappearing.", "video-llm-prediction": "Caption B: The pile of salt is disappearing.", "match_success": true, "rating": 1 } ] }, "23370985_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice crystal is melting.\nSentence B: The ice crystal is shattering.", "gt-answer": "Sentence A: The ice crystal is melting.", "video-llm-prediction": "Sentence B: The ice crystal is shattering.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The ice crystal is melting.\nCaption B: The ice crystal is forming.", "gt-answer": "Caption A: The ice crystal is melting.", "video-llm-prediction": "Caption B: The ice crystal is forming.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ice crystal is reducing in size.\nOption 2: The ice crystal is growing in size.", "gt-answer": "Option 1: The ice crystal is reducing in size.", "video-llm-prediction": "Option 1: The ice crystal is reducing in size.", "match_success": true, "rating": 1 } ] }, "1055981522_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The 3d shapes are transforming from cubes into spheres.\nCaption B: The 3d shapes are transforming from spheres into cubes.", "gt-answer": "Caption B: The 3d shapes are transforming from spheres into cubes.", "video-llm-prediction": "Caption A: The 3d shapes are transforming from cubes into spheres.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3d shapes are transforming from spheres into cubes.\nOption 2: The 3d shapes are transforming from cubes into spheres.", "gt-answer": "Option 1: The 3d shapes are transforming from spheres into cubes.", "video-llm-prediction": "Option 1: The 3d shapes are transforming from spheres into cubes.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3d shapes are transforming from cubes into spheres.\nSentence B: The 3d shapes are transforming from spheres into cubes.", "gt-answer": "Sentence B: The 3d shapes are transforming from spheres into cubes.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1081734740_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The leaf is turning from green to yellow.\nOption 2: The leaf is turning from yellow to green.", "gt-answer": "Option 2: The leaf is turning from yellow to green.", "video-llm-prediction": "Option 1: The leaf is turning from green to yellow.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The texture of the leaf is turning from green to yellow.\nCaption B: The leaf is turning from green to white.", "gt-answer": "Caption B: The leaf is turning from green to white.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The texture of the leaf is turning from yellow to green.\nSentence B: The texture of the leaf is turning from green to yellow.", "gt-answer": "Sentence A: The texture of the leaf is turning from yellow to green.", "video-llm-prediction": "Sentence A: The texture of the leaf is turning from yellow to green.", "match_success": true, "rating": 1 } ] }, "1093719871_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The pink flowers are turning from full blossom to withered.\nSentence B: The pink flowers are turning from withered to full blossom.", "gt-answer": "Sentence A: The pink flowers are turning from full blossom to withered.", "video-llm-prediction": "Sentence A: The pink flowers are turning from full blossom to withered.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pink flowers are growing taller.\nOption 2: The pink flowers are turning from full blossom to withered.", "gt-answer": "Option 2: The pink flowers are turning from full blossom to withered.", "video-llm-prediction": "Option 2: The pink flowers are turning from full blossom to withered.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The pink flowers are falling off petals.\nCaption B: The pink flowers are turning from full blossom to withered.", "gt-answer": "Caption B: The pink flowers are turning from full blossom to withered.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1055973887_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The fire ball is getting smaller.\nOption 2: The fire ball is getting larger.", "gt-answer": "Option 1: The fire ball is getting smaller.", "video-llm-prediction": "Option 2: The fire ball is getting larger.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The fire ball is shrinking in size.\nSentence B: The fire ball is getting larger.", "gt-answer": "Sentence A: The fire ball is shrinking in size.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The fire ball is getting larger.\nCaption B: The fire ball is getting smaller.", "gt-answer": "Caption B: The fire ball is getting smaller.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1098710341_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The glass is going from empty to full of water.\nOption 2: The glass is going from full of water to empty.", "gt-answer": "Option 2: The glass is going from full of water to empty.", "video-llm-prediction": "Option 1: The glass is going from empty to full of water.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The glass is going from full of water to empty.\nSentence B: The glass is going from empty to full of water.", "gt-answer": "Sentence A: The glass is going from full of water to empty.", "video-llm-prediction": "Sentence B: The glass is going from empty to full of water.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The glass is going from empty to full of water.\nCaption B: The glass is going from full of water to empty.", "gt-answer": "Caption B: The glass is going from full of water to empty.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1099116143_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: White foam appears on the surface of the pink liquid.\nCaption B: White foam disappears from the surface of the pink liquid.", "gt-answer": "Caption B: White foam disappears from the surface of the pink liquid.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pink liquid is freezing.\nOption 2: White foam disappears from the surface of the pink liquid.", "gt-answer": "Option 2: White foam disappears from the surface of the pink liquid.", "video-llm-prediction": "Option 2: White foam disappears from the surface of the pink liquid.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: White foam disappears from the surface of the pink liquid.\nSentence B: The pink liquid is evaporating.", "gt-answer": "Sentence A: White foam disappears from the surface of the pink liquid.", "video-llm-prediction": "Sentence B: The pink liquid is evaporating.", "match_success": true, "rating": 0 } ] }, "1025623079_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The skyscraper is growing taller.\nCaption B: The skyscraper is collapsing.", "gt-answer": "Caption A: The skyscraper is growing taller.", "video-llm-prediction": "Caption B: The skyscraper is collapsing.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The skyscraper is growing taller.\nOption 2: The skyscraper is collapsing.", "gt-answer": "Option 1: The skyscraper is growing taller.", "video-llm-prediction": "Option 2: The skyscraper is collapsing.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The skyscraper is standing up.\nSentence B: The skyscraper is collapsing.", "gt-answer": "Sentence A: The skyscraper is standing up.", "video-llm-prediction": "Sentence B: The skyscraper is collapsing.", "match_success": true, "rating": 0 } ] }, "1063373449_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The coronavirus is assembling together.\nOption 2: The coronavirus is decreasing in size.", "gt-answer": "Option 1: The coronavirus is assembling together.", "video-llm-prediction": "Option 2: The coronavirus is decreasing in size.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The coronavirus is dissolving under the attack of antibodies.\nSentence B: The coronavirus is assembling together.", "gt-answer": "Sentence B: The coronavirus is assembling together.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The coronavirus is dissolving under the attack of antibodies.\nCaption B: The coronavirus is assembling together.", "gt-answer": "Caption B: The coronavirus is assembling together.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1062609286_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The battery charge is decreasing.\nOption 2: The battery charge is increasing.", "gt-answer": "Option 1: The battery charge is decreasing.", "video-llm-prediction": "Option 1: The battery charge is decreasing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The battery charge is staying constant.\nCaption B: The battery charge is decreasing.", "gt-answer": "Caption B: The battery charge is decreasing.", "video-llm-prediction": "Caption B: The battery charge is decreasing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The battery charge is decreasing.\nSentence B: The battery charge is increasing.", "gt-answer": "Sentence A: The battery charge is decreasing.", "video-llm-prediction": "Sentence A: The battery charge is decreasing.", "match_success": true, "rating": 1 } ] }, "1060403198_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The tree is decreasing in height.\nSentence B: The tree is increasing in height.", "gt-answer": "Sentence A: The tree is decreasing in height.", "video-llm-prediction": "Sentence A: The tree is decreasing in height.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The tree is growing taller.\nCaption B: The tree is becoming shorter.", "gt-answer": "Caption B: The tree is becoming shorter.", "video-llm-prediction": "Caption A: The tree is growing taller.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The tree is decreasing in height.\nOption 2: The tree is increasing in height.", "gt-answer": "Option 1: The tree is decreasing in height.", "video-llm-prediction": "Option 1: The tree is decreasing in height.", "match_success": true, "rating": 1 } ] }, "1099109715_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The number of fruits and vegetables is increasing.\nOption 2: The number of fruits and vegetables is decreasing.", "gt-answer": "Option 2: The number of fruits and vegetables is decreasing.", "video-llm-prediction": "Option 1: The number of fruits and vegetables is increasing.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The number of fruits and vegetables is decreasing.\nSentence B: The fruits and vegetables are becoming rotten.", "gt-answer": "Sentence A: The number of fruits and vegetables is decreasing.", "video-llm-prediction": "Sentence A: The number of fruits and vegetables is decreasing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The number of fruits and vegetables is decreasing.\nCaption B: The fruits and vegetables are staying the same.", "gt-answer": "Caption A: The number of fruits and vegetables is decreasing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1051211272_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The toast with cream cheese is gradually growing larger.\nSentence B: The toast with cream cheese is gradually being eaten out and disappearing.", "gt-answer": "Sentence A: The toast with cream cheese is gradually growing larger.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The toast with cream cheese is gradually being eaten out and disappearing.\nOption 2: The toast with cream cheese is gradually emerging piece by piece.", "gt-answer": "Option 2: The toast with cream cheese is gradually emerging piece by piece.", "video-llm-prediction": "Option 1: The toast with cream cheese is gradually being eaten out and disappearing.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The toast with cream cheese is gradually growing larger.\nCaption B: The toast with cream cheese is gradually being eaten out and disappearing.", "gt-answer": "Caption A: The toast with cream cheese is gradually growing larger.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1059815936_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The paper is changing from a wrinkled paper ball into a flattened sheet.\nSentence B: The paper is changing from a flattened sheet into a wrinkled paper ball.", "gt-answer": "Sentence B: The paper is changing from a flattened sheet into a wrinkled paper ball.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The paper is changing from a wrinkled paper ball into a flattened sheet.\nCaption B: The paper is disappearing.", "gt-answer": "Caption B: The paper is disappearing.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The paper is changing from a flattened sheet into a wrinkled paper ball.\nOption 2: The paper is tearing apart.", "gt-answer": "Option 1: The paper is changing from a flattened sheet into a wrinkled paper ball.", "video-llm-prediction": "Option 1: The paper is changing from a flattened sheet into a wrinkled paper ball.", "match_success": true, "rating": 1 } ] }, "1059718130_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun above is rising at the same speed as the sun below.\nSentence B: The sun above is rising slower than the sun below.", "gt-answer": "Sentence A: The sun above is rising at the same speed as the sun below.", "video-llm-prediction": "Sentence A: The sun above is rising at the same speed as the sun below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The sun above is rising at the same speed as the sun below.\nCaption B: The sun below is rising faster than the sun above.", "gt-answer": "Caption A: The sun above is rising at the same speed as the sun below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun above is rising at the same speed as the sun below.\nOption 2: The sun above is not rising at the same speed as the sun below.", "gt-answer": "Option 1: The sun above is rising at the same speed as the sun below.", "video-llm-prediction": "Option 2: The sun above is not rising at the same speed as the sun below.", "match_success": true, "rating": 0 } ] }, "1059718130_concat_1": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The sun above is rising faster than the sun below.\nOption 2: The sun above is rising slower than the sun below.", "gt-answer": "Option 2: The sun above is rising slower than the sun below.", "video-llm-prediction": "Option 1: The sun above is rising faster than the sun below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: Both suns are rising at the same speed.\nCaption B: The sun above is rising slower than the sun below.", "gt-answer": "Caption B: The sun above is rising slower than the sun below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun below is rising at the same speed as the sun above.\nSentence B: The sun above is rising slower than the sun below.", "gt-answer": "Sentence B: The sun above is rising slower than the sun below.", "video-llm-prediction": "Sentence B: The sun above is rising slower than the sun below.", "match_success": true, "rating": 1 } ] }, "1059718130_concat_2": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The sun above is rising faster.\nSentence B: The sun above is rising at the same speed as the sun below.", "gt-answer": "Sentence A: The sun above is rising faster.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun above is rising faster.\nOption 2: The sun below is rising faster than the sun above.", "gt-answer": "Option 1: The sun above is rising faster.", "video-llm-prediction": "Option 2: The sun below is rising faster than the sun above.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The sun above is rising faster.\nCaption B: Both suns are rising at the same speed.", "gt-answer": "Caption A: The sun above is rising faster.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1098153561_concat_0": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The speed that the forest above changes color is faster than the forest below.\nCaption B: The speed that the forest above changes color is at the same speed as the forest below.", "gt-answer": "Caption B: The speed that the forest above changes color is at the same speed as the forest below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed that the forest above changes color is at the same speed as the forest below.\nOption 2: The speed that the forest above changes color is slower than the forest below.", "gt-answer": "Option 1: The speed that the forest above changes color is at the same speed as the forest below.", "video-llm-prediction": "Option 2: The speed that the forest above changes color is slower than the forest below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed that the forest above changes color is at the same speed as the forest below.\nSentence B: The speed that the forest above changes color is faster than the forest below.", "gt-answer": "Sentence A: The speed that the forest above changes color is at the same speed as the forest below.", "video-llm-prediction": "Sentence A: The speed that the forest above changes color is at the same speed as the forest below.", "match_success": true, "rating": 1 } ] }, "1098153561_concat_1": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The forest above changes color faster than the forest below.\nSentence B: The forest above changes color at a slower speed than the forest below.", "gt-answer": "Sentence B: The forest above changes color at a slower speed than the forest below.", "video-llm-prediction": "Sentence A: The forest above changes color faster than the forest below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The forest above changes color at the same speed as the forest below.\nCaption B: The forest above changes color at a slower speed than the forest below.", "gt-answer": "Caption B: The forest above changes color at a slower speed than the forest below.", "video-llm-prediction": "Caption A: The forest above changes color at the same speed as the forest below.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The forest above changes color at a slower speed than the forest below.\nOption 2: The forest above changes color at a faster speed than the forest below.", "gt-answer": "Option 1: The forest above changes color at a slower speed than the forest below.", "video-llm-prediction": "Option 2: The forest above changes color at a faster speed than the forest below.", "match_success": true, "rating": 0 } ] }, "1098153561_concat_2": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The forest above changes color faster than the forest below.\nOption 2: The forest above changes color at the same speed as the forest below.", "gt-answer": "Option 1: The forest above changes color faster than the forest below.", "video-llm-prediction": "Option 1: The forest above changes color faster than the forest below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The forest above changes color slower than the forest below.\nCaption B: The forest above changes color faster than the forest below.", "gt-answer": "Caption B: The forest above changes color faster than the forest below.", "video-llm-prediction": "Caption B: The forest above changes color faster than the forest below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The forest below changes color faster than the forest above.\nSentence B: The forest above changes color faster than the forest below.", "gt-answer": "Sentence B: The forest above changes color faster than the forest below.", "video-llm-prediction": "Sentence A: The forest below changes color faster than the forest above.", "match_success": true, "rating": 0 } ] }, "1059462749_concat_0": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The person above and the person below are moving at the same speed.\nCaption B: The person above is climbing faster than the person below.", "gt-answer": "Caption A: The person above and the person below are moving at the same speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person above and the person below are moving at the same speed.\nOption 2: The person above is climbing slower than the person below.", "gt-answer": "Option 1: The person above and the person below are moving at the same speed.", "video-llm-prediction": "Option 2: The person above is climbing slower than the person below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person above and the person below are moving at the same speed.\nSentence B: The person below is climbing faster than the person above.", "gt-answer": "Sentence A: The person above and the person below are moving at the same speed.", "video-llm-prediction": "Sentence B: The person below is climbing faster than the person above.", "match_success": true, "rating": 0 } ] }, "1059462749_concat_1": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The person above is climbing faster than the person below.\nCaption B: The person above is climbing slower than the person below.", "gt-answer": "Caption B: The person above is climbing slower than the person below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person above is climbing slower than the person below.\nSentence B: The person above and below are moving at the same speed.", "gt-answer": "Sentence A: The person above is climbing slower than the person below.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person above is climbing slower than the person below.\nOption 2: The person above is moving at the same speed as the person below.", "gt-answer": "Option 1: The person above is climbing slower than the person below.", "video-llm-prediction": "Option 1: The person above is climbing slower than the person below.", "match_success": true, "rating": 1 } ] }, "1059462749_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The person above is climbing faster than the person below.\nCaption B: The person above is climbing at the same speed as the person below.", "gt-answer": "Caption A: The person above is climbing faster than the person below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person above is climbing faster than the person below.\nSentence B: The person above is climbing slower than the person below.", "gt-answer": "Sentence A: The person above is climbing faster than the person below.", "video-llm-prediction": "Sentence A: The person above is climbing faster than the person below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person above is climbing faster than the person below.\nOption 2: The person below is moving faster than the person above.", "gt-answer": "Option 1: The person above is climbing faster than the person below.", "video-llm-prediction": "Option 2: The person below is moving faster than the person above.", "match_success": true, "rating": 0 } ] }, "1059072773_concat_0": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The ice cream above is melting at the same speed as the ice cream below.\nOption 2: The ice cream above is melting faster than the ice cream below.", "gt-answer": "Option 1: The ice cream above is melting at the same speed as the ice cream below.", "video-llm-prediction": "Option 2: The ice cream above is melting faster than the ice cream below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream above is melting at the same speed as the ice cream below.\nSentence B: The melting of the ice cream above is slower than the ice cream below.", "gt-answer": "Sentence A: The ice cream above is melting at the same speed as the ice cream below.", "video-llm-prediction": "Sentence A: The ice cream above is melting at the same speed as the ice cream below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The ice cream above is melting at the same speed as the ice cream below.\nCaption B: The melting of the ice cream above is not at the same speed as the ice cream below.", "gt-answer": "Caption A: The ice cream above is melting at the same speed as the ice cream below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1059072773_concat_1": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The ice cream above is melting faster than the ice cream below.\nCaption B: The ice cream above is melting slower than the ice cream below.", "gt-answer": "Caption B: The ice cream above is melting slower than the ice cream below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ice cream above is melting slower than the ice cream below.\nOption 2: The ice cream above is melting at the same speed as the ice cream below.", "gt-answer": "Option 1: The ice cream above is melting slower than the ice cream below.", "video-llm-prediction": "Option 1: The ice cream above is melting slower than the ice cream below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream above is melting slower than the ice cream below.\nSentence B: The ice cream above is melting faster than the ice cream below.", "gt-answer": "Sentence A: The ice cream above is melting slower than the ice cream below.", "video-llm-prediction": "Sentence A: The ice cream above is melting slower than the ice cream below.", "match_success": true, "rating": 1 } ] }, "1059072773_concat_2": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream above is melting at the same speed as the ice cream below.\nSentence B: The ice cream above is melting faster than the ice cream below.", "gt-answer": "Sentence B: The ice cream above is melting faster than the ice cream below.", "video-llm-prediction": "Sentence B: The ice cream above is melting faster than the ice cream below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ice cream above is melting faster than the ice cream below.\nOption 2: The ice cream above is melting slower than the ice cream below.", "gt-answer": "Option 1: The ice cream above is melting faster than the ice cream below.", "video-llm-prediction": "Option 1: The ice cream above is melting faster than the ice cream below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The ice cream above is melting faster than the ice cream below.\nCaption B: The ice cream above is melting slower than the ice cream below.", "gt-answer": "Caption A: The ice cream above is melting faster than the ice cream below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1090578917_concat_0": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The man above is jumping slower than the man below.\nCaption B: The man above is jumping at the same speed as the man below.", "gt-answer": "Caption B: The man above is jumping at the same speed as the man below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man above is jumping at the same speed as the man below.\nSentence B: The man above is jumping faster than the man below.", "gt-answer": "Sentence A: The man above is jumping at the same speed as the man below.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In comparison to the man below, the speed of the man above jumping looks faster.\nOption 2: The man above is jumping at the same speed as the man below.", "gt-answer": "Option 2: The man above is jumping at the same speed as the man below.", "video-llm-prediction": "Option 1: In comparison to the man below, the speed of the man above jumping looks faster.", "match_success": true, "rating": 0 } ] }, "1090578917_concat_1": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man above is jumping at a slower speed than the man below.\nOption 2: The man above is jumping at the same speed as the man below.", "gt-answer": "Option 1: The man above is jumping at a slower speed than the man below.", "video-llm-prediction": "Option 1: The man above is jumping at a slower speed than the man below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man above is jumping at a faster speed than the man below.\nSentence B: The man above is jumping at a slower speed than the man below.", "gt-answer": "Sentence B: The man above is jumping at a slower speed than the man below.", "video-llm-prediction": "Sentence A: The man above is jumping at a faster speed than the man below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The man above is jumping at a slower speed than the man below.\nCaption B: The man above is jumping at a faster speed than the man below.", "gt-answer": "Caption A: The man above is jumping at a slower speed than the man below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1090578917_concat_2": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man above is jumping faster than the man below.\nSentence B: The man above is jumping at the same speed as the man below.", "gt-answer": "Sentence A: The man above is jumping faster than the man below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man above is jumping faster than the man below.\nCaption B: The man above is jumping slower than the man below.", "gt-answer": "Caption A: The man above is jumping faster than the man below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the man above jumping looks slower.\nOption 2: The man above is jumping faster than the man below.", "gt-answer": "Option 2: The man above is jumping faster than the man below.", "video-llm-prediction": "Option 2: The man above is jumping faster than the man below.", "match_success": true, "rating": 1 } ] }, "1075338140_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ball above is faster than the ball below.\nSentence B: The speed of the ball above is the same as the ball below.", "gt-answer": "Sentence B: The speed of the ball above is the same as the ball below.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the ball above is the same as the ball below.\nCaption B: The ball below is slower than the ball above.", "gt-answer": "Caption A: The speed of the ball above is the same as the ball below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the ball above is the same as the ball below.\nOption 2: Both balls are moving at different speeds.", "gt-answer": "Option 1: The speed of the ball above is the same as the ball below.", "video-llm-prediction": "Option 2: Both balls are moving at different speeds.", "match_success": true, "rating": 0 } ] }, "1075338140_concat_1": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The ball above is moving slower than the ball below.\nCaption B: The ball above is moving faster than the ball below.", "gt-answer": "Caption A: The ball above is moving slower than the ball below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The ball above is moving slower than the ball below.\nOption 2: Both balls are moving at the same speed.", "gt-answer": "Option 1: The ball above is moving slower than the ball below.", "video-llm-prediction": "Option 1: The ball above is moving slower than the ball below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ball above is moving slower than the ball below.\nSentence B: The ball below is moving slower.", "gt-answer": "Sentence A: The ball above is moving slower than the ball below.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 } ] }, "1075338140_concat_2": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The ball above is moving at the same speed as the ball below.\nOption 2: The ball above is moving faster.", "gt-answer": "Option 2: The ball above is moving faster.", "video-llm-prediction": "Option 1: The ball above is moving at the same speed as the ball below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ball below is moving faster.\nSentence B: The ball above is moving faster.", "gt-answer": "Sentence B: The ball above is moving faster.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The ball above is moving slower than the ball below.\nCaption B: The ball above is moving faster.", "gt-answer": "Caption B: The ball above is moving faster.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1077575504_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the pile of salt above is growing at the same speed as the pile of salt below.\nSentence B: The pile of salt above is growing at a faster speed than the pile of salt below.", "gt-answer": "Sentence A: The speed of the pile of salt above is growing at the same speed as the pile of salt below.", "video-llm-prediction": "Sentence B: The pile of salt above is growing at a faster speed than the pile of salt below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the pile of salt above is growing at the same speed as the pile of salt below.\nCaption B: The pile of salt above is growing at a slower speed than the pile of salt below.", "gt-answer": "Caption A: The speed of the pile of salt above is growing at the same speed as the pile of salt below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pile of salt above is growing at a slower speed than the pile of salt below.\nOption 2: The speed of the pile of salt above is growing at the same speed as the pile of salt below.", "gt-answer": "Option 2: The speed of the pile of salt above is growing at the same speed as the pile of salt below.", "video-llm-prediction": "Option 1: The pile of salt above is growing at a slower speed than the pile of salt below.", "match_success": true, "rating": 0 } ] }, "1077575504_concat_1": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The pile of salt above is growing at a slower speed than the pile of salt below.\nSentence B: The pile of salt above is growing at a faster speed than the pile of salt below.", "gt-answer": "Sentence A: The pile of salt above is growing at a slower speed than the pile of salt below.", "video-llm-prediction": "Sentence A: The pile of salt above is growing at a slower speed than the pile of salt below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The pile of salt above is growing at a slower speed than the pile of salt below.\nCaption B: The pile of salt above is growing at the same speed as the pile of salt below.", "gt-answer": "Caption A: The pile of salt above is growing at a slower speed than the pile of salt below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pile of salt below is growing slower than the pile of salt above.\nOption 2: The pile of salt above is growing at a slower speed than the pile of salt below.", "gt-answer": "Option 2: The pile of salt above is growing at a slower speed than the pile of salt below.", "video-llm-prediction": "Option 2: The pile of salt above is growing at a slower speed than the pile of salt below.", "match_success": true, "rating": 1 } ] }, "1077575504_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The pile of salt above is growing at a faster speed than the pile of salt below.\nCaption B: The pile of salt above is growing at the same speed as the pile of salt below.", "gt-answer": "Caption A: The pile of salt above is growing at a faster speed than the pile of salt below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pile of salt above is growing at a faster speed than the pile of salt below.\nOption 2: The pile of salt above is growing at a slower speed than the pile of salt below.", "gt-answer": "Option 1: The pile of salt above is growing at a faster speed than the pile of salt below.", "video-llm-prediction": "Option 1: The pile of salt above is growing at a faster speed than the pile of salt below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The pile of salt above is growing at a slower speed than the pile of salt below.\nSentence B: The pile of salt above is growing at a faster speed than the pile of salt below.", "gt-answer": "Sentence B: The pile of salt above is growing at a faster speed than the pile of salt below.", "video-llm-prediction": "Sentence A: The pile of salt above is growing at a slower speed than the pile of salt below.", "match_success": true, "rating": 0 } ] }, "1100319395_concat_0": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The white circle above is rotating at the same speed as the white circle below.\nOption 2: The white circle above is rotating faster than the white circle below.", "gt-answer": "Option 1: The white circle above is rotating at the same speed as the white circle below.", "video-llm-prediction": "Option 1: The white circle above is rotating at the same speed as the white circle below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The white circle above is rotating at the same speed as the white circle below.\nCaption B: The white circle above is rotating slower than the white circle below.", "gt-answer": "Caption A: The white circle above is rotating at the same speed as the white circle below.", "video-llm-prediction": "Caption B: The white circle above is rotating slower than the white circle below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The white circle above is rotating at the same speed as the white circle below.\nSentence B: The white circle above is rotating faster than the white circle below.", "gt-answer": "Sentence A: The white circle above is rotating at the same speed as the white circle below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1100319395_concat_1": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The white circle above is rotating faster than the white circle below.\nOption 2: The white circle above is rotating at the same speed as the white circle below.", "gt-answer": "Option 1: The white circle above is rotating faster than the white circle below.", "video-llm-prediction": "Option 1: The white circle above is rotating faster than the white circle below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The white circle above is rotating faster than the white circle below.\nCaption B: The white circle above is rotating slower than the white circle below.", "gt-answer": "Caption A: The white circle above is rotating faster than the white circle below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The white circle above is rotating slower than the white circle below.\nSentence B: The white circle above is rotating faster than the white circle below.", "gt-answer": "Sentence B: The white circle above is rotating faster than the white circle below.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1100319395_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The white circle above is rotating at a slower speed than the white circle below.\nCaption B: The white circle above is rotating at the same speed as the white circle below.", "gt-answer": "Caption A: The white circle above is rotating at a slower speed than the white circle below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The white circle above is rotating at a slower speed than the white circle below.\nSentence B: The white circle above is rotating faster than the white circle below.", "gt-answer": "Sentence A: The white circle above is rotating at a slower speed than the white circle below.", "video-llm-prediction": "Sentence B: The white circle above is rotating faster than the white circle below.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The white circle above is rotating at a slower speed than the white circle below.\nOption 2: The white circle above is rotating faster than the white circle below.", "gt-answer": "Option 1: The white circle above is rotating at a slower speed than the white circle below.", "video-llm-prediction": "Option 2: The white circle above is rotating faster than the white circle below.", "match_success": true, "rating": 0 } ] }, "1086820415_concat_0": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the wave above is the same as the wave below.\nOption 2: The wave above is moving faster than the wave below.", "gt-answer": "Option 1: The speed of the wave above is the same as the wave below.", "video-llm-prediction": "Option 2: The wave above is moving faster than the wave below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the wave above is the same as the wave below.\nSentence B: The wave above is moving slower than the wave below.", "gt-answer": "Sentence A: The speed of the wave above is the same as the wave below.", "video-llm-prediction": "Sentence A: The speed of the wave above is the same as the wave below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The wave below is moving faster.\nCaption B: The speed of the wave above is the same as the wave below.", "gt-answer": "Caption B: The speed of the wave above is the same as the wave below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1086820415_concat_1": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The speed of the wave above is slower than the wave below.\nCaption B: The speed of the wave above is faster than the wave below.", "gt-answer": "Caption B: The speed of the wave above is faster than the wave below.", "video-llm-prediction": "Caption B: The speed of the wave above is faster than the wave below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the wave above is faster than the wave below.\nOption 2: Both waves are moving at the same speed.", "gt-answer": "Option 1: The speed of the wave above is faster than the wave below.", "video-llm-prediction": "Option 1: The speed of the wave above is faster than the wave below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the wave above is faster than the wave below.\nSentence B: The wave below is moving faster than the wave above.", "gt-answer": "Sentence A: The speed of the wave above is faster than the wave below.", "video-llm-prediction": "Sentence B: The wave below is moving faster than the wave above.", "match_success": true, "rating": 0 } ] }, "1086820415_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The wave above is moving at the same speed as the wave below.\nCaption B: The wave above is moving slower than the wave below.", "gt-answer": "Caption B: The wave above is moving slower than the wave below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Both waves are moving at the same speed.\nOption 2: The wave above is moving slower than the wave below.", "gt-answer": "Option 2: The wave above is moving slower than the wave below.", "video-llm-prediction": "Option 2: The wave above is moving slower than the wave below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The wave below is moving faster than the wave above.\nSentence B: The wave above is moving slower than the wave below.", "gt-answer": "Sentence B: The wave above is moving slower than the wave below.", "video-llm-prediction": "Sentence B: The wave above is moving slower than the wave below.", "match_success": true, "rating": 1 } ] }, "1096238125_concat_0": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The two people above are lifting the kettlebell slower than the two people below.\nCaption B: The two people above are lifting the kettlebell at the same speed as the two people below.", "gt-answer": "Caption B: The two people above are lifting the kettlebell at the same speed as the two people below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The two people above are lifting the kettlebell at the same speed as the two people below.\nOption 2: The two people above are lifting the kettlebell faster than the two people below.", "gt-answer": "Option 1: The two people above are lifting the kettlebell at the same speed as the two people below.", "video-llm-prediction": "Option 2: The two people above are lifting the kettlebell faster than the two people below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The two people above are lifting the kettlebell at the same speed as the two people below.\nSentence B: The two people above are lifting the kettlebell faster than the two people below.", "gt-answer": "Sentence A: The two people above are lifting the kettlebell at the same speed as the two people below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1096238125_concat_1": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The two people above are lifting the kettlebell slower than the two people below.\nOption 2: The two people above are lifting the kettlebell faster than the two people below.", "gt-answer": "Option 2: The two people above are lifting the kettlebell faster than the two people below.", "video-llm-prediction": "Option 2: The two people above are lifting the kettlebell faster than the two people below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The two people above are lifting the kettlebell faster than the two people below.\nCaption B: The two people above are lifting the kettlebell at the same speed as the two people below.", "gt-answer": "Caption A: The two people above are lifting the kettlebell faster than the two people below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The two people above are lifting the kettlebell slower than the two people below.\nSentence B: The two people above are lifting the kettlebell faster than the two people below.", "gt-answer": "Sentence B: The two people above are lifting the kettlebell faster than the two people below.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1096238125_concat_2": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The two people above are lifting the kettlebell slower than the two people below.\nOption 2: The two people above are lifting the kettlebell at the same speed as the two people below.", "gt-answer": "Option 1: The two people above are lifting the kettlebell slower than the two people below.", "video-llm-prediction": "Option 1: The two people above are lifting the kettlebell slower than the two people below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The two people above are lifting the kettlebell faster than the two people below.\nCaption B: The two people above are lifting the kettlebell slower than the two people below.", "gt-answer": "Caption B: The two people above are lifting the kettlebell slower than the two people below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The two people above are lifting the kettlebell slower than the two people below.\nSentence B: The two people above are lifting the kettlebell faster than the two people below.", "gt-answer": "Sentence A: The two people above are lifting the kettlebell slower than the two people below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1056433484_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the earth above is the same as the speed of the earth below.\nSentence B: The speed of the earth above is slower than the earth below.", "gt-answer": "Sentence A: The speed of the earth above is the same as the speed of the earth below.", "video-llm-prediction": "Sentence B: The speed of the earth above is slower than the earth below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the earth above is the same as the speed of the earth below.\nCaption B: The speed of the earth above is faster than the earth below.", "gt-answer": "Caption A: The speed of the earth above is the same as the speed of the earth below.", "video-llm-prediction": "Caption A: The speed of the earth above is the same as the speed of the earth below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the earth above is the same as the speed of the earth below.\nOption 2: The speed of the earth above is different from the earth below.", "gt-answer": "Option 1: The speed of the earth above is the same as the speed of the earth below.", "video-llm-prediction": "Option 1: The speed of the earth above is the same as the speed of the earth below.", "match_success": true, "rating": 1 } ] }, "1056433484_concat_1": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The speed of the earth above is slower than the earth below.\nSentence B: The speed of the earth above is faster than the earth below.", "gt-answer": "Sentence A: The speed of the earth above is slower than the earth below.", "video-llm-prediction": "Sentence A: The speed of the earth above is slower than the earth below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the earth above is slower than the earth below.\nCaption B: The speed of the earth above is the same as the earth below.", "gt-answer": "Caption A: The speed of the earth above is slower than the earth below.", "video-llm-prediction": "Caption A: The speed of the earth above is slower than the earth below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the earth above is slower than the earth below.\nOption 2: The speed of the earth above is faster than the earth below.", "gt-answer": "Option 1: The speed of the earth above is slower than the earth below.", "video-llm-prediction": "Option 2: The speed of the earth above is faster than the earth below.", "match_success": true, "rating": 0 } ] }, "1056433484_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The speed of the earth above is slower than the earth below.\nCaption B: The speed of the earth above is faster than the earth below.", "gt-answer": "Caption B: The speed of the earth above is faster than the earth below.", "video-llm-prediction": "Caption A: The speed of the earth above is slower than the earth below.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the earth above is the same as the earth below.\nOption 2: The speed of the earth above is faster than the earth below.", "gt-answer": "Option 2: The speed of the earth above is faster than the earth below.", "video-llm-prediction": "Option 2: The speed of the earth above is faster than the earth below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The earth above rotates at the same speed as the earth below.\nSentence B: The speed of the earth above is faster than the earth below.", "gt-answer": "Sentence B: The speed of the earth above is faster than the earth below.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "15695290_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person above draws a picture more slowly than the person below.\nSentence B: The person above draws a picture at the same speed as the person below.", "gt-answer": "Sentence B: The person above draws a picture at the same speed as the person below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person above draws a picture more rapidly than the person below.\nOption 2: The person above draws a picture at the same speed as the person below.", "gt-answer": "Option 2: The person above draws a picture at the same speed as the person below.", "video-llm-prediction": "Option 1: The person above draws a picture more rapidly than the person below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person above draws a picture more rapidly than the person below.\nCaption B: The person above draws a picture at the same speed as the person below.", "gt-answer": "Caption B: The person above draws a picture at the same speed as the person below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "15695290_concat_1": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The person above draws a picture at an equal speed as the person below.\nCaption B: The person above draws a picture more slowly than the person below.", "gt-answer": "Caption B: The person above draws a picture more slowly than the person below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person above draws a picture more slowly than the person below.\nSentence B: The person above draws a picture more rapidly than the person below.", "gt-answer": "Sentence A: The person above draws a picture more slowly than the person below.", "video-llm-prediction": "Sentence B: The person above draws a picture more rapidly than the person below.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person above draws a picture more slowly than the person below.\nOption 2: The person above draws a picture faster than the person below.", "gt-answer": "Option 1: The person above draws a picture more slowly than the person below.", "video-llm-prediction": "Option 2: The person above draws a picture faster than the person below.", "match_success": true, "rating": 0 } ] }, "15695290_concat_2": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The person above is drawing a picture slower than the person below.\nSentence B: The person above is drawing a picture faster than the person below.", "gt-answer": "Sentence B: The person above is drawing a picture faster than the person below.", "video-llm-prediction": "Sentence B: The person above is drawing a picture faster than the person below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person above is drawing a picture at the same speed as the person below.\nOption 2: The person above is drawing a picture faster than the person below.", "gt-answer": "Option 2: The person above is drawing a picture faster than the person below.", "video-llm-prediction": "Option 1: The person above is drawing a picture at the same speed as the person below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The person above is drawing a picture faster than the person below.\nCaption B: The person above is drawing a picture more slowly than the person below.", "gt-answer": "Caption A: The person above is drawing a picture faster than the person below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1047368344_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl above is running slower than the girl below.\nSentence B: The girl above is running at the same speed as the girl below.", "gt-answer": "Sentence B: The girl above is running at the same speed as the girl below.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The girl above is running faster than the girl below.\nOption 2: The girl above is running at the same speed as the girl below.", "gt-answer": "Option 2: The girl above is running at the same speed as the girl below.", "video-llm-prediction": "Option 1: The girl above is running faster than the girl below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The girl above is running at the same speed as the girl below.\nCaption B: The speed of the girl above is different from the girl below.", "gt-answer": "Caption A: The girl above is running at the same speed as the girl below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1047368344_concat_1": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl above is running slower than the girl below.\nSentence B: The girl above is running at the same speed as the girl below.", "gt-answer": "Sentence A: The girl above is running slower than the girl below.", "video-llm-prediction": "Sentence A: The girl above is running slower than the girl below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The girl above is running faster than the girl below.\nOption 2: The girl above is running slower than the girl below.", "gt-answer": "Option 2: The girl above is running slower than the girl below.", "video-llm-prediction": "Option 1: The girl above is running faster than the girl below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The girl above is running faster than the girl below.\nCaption B: The girl above is running slower than the girl below.", "gt-answer": "Caption B: The girl above is running slower than the girl below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1047368344_concat_2": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl above is running faster than the girl below.\nSentence B: The girl above is running at the same speed as the girl below.", "gt-answer": "Sentence A: The girl above is running faster than the girl below.", "video-llm-prediction": "Sentence A: The girl above is running faster than the girl below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The girl above is running faster than the girl below.\nOption 2: The girl above is running slower than the girl below.", "gt-answer": "Option 1: The girl above is running faster than the girl below.", "video-llm-prediction": "Option 1: The girl above is running faster than the girl below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the girl above is slower than the girl below.\nCaption B: The girl above is running faster than the girl below.", "gt-answer": "Caption B: The girl above is running faster than the girl below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1060403198_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The tree above is growing slower than the tree below.\nSentence B: The tree above is growing at the same speed as the tree below.", "gt-answer": "Sentence B: The tree above is growing at the same speed as the tree below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The tree above is growing faster than the tree below.\nCaption B: The tree above is growing at the same speed as the tree below.", "gt-answer": "Caption B: The tree above is growing at the same speed as the tree below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The tree above is growing at the same speed as the tree below.\nOption 2: The tree above is growing faster than the tree below.", "gt-answer": "Option 1: The tree above is growing at the same speed as the tree below.", "video-llm-prediction": "Option 2: The tree above is growing faster than the tree below.", "match_success": true, "rating": 0 } ] }, "1060403198_concat_1": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The tree above is growing at the same speed as the tree below.\nOption 2: The tree above is growing faster than the tree below.", "gt-answer": "Option 2: The tree above is growing faster than the tree below.", "video-llm-prediction": "Option 2: The tree above is growing faster than the tree below.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The tree above is growing slower than the tree below.\nCaption B: The tree above is growing faster than the tree below.", "gt-answer": "Caption B: The tree above is growing faster than the tree below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The tree above is growing slower than the tree below.\nSentence B: The tree above is growing faster than the tree below.", "gt-answer": "Sentence B: The tree above is growing faster than the tree below.", "video-llm-prediction": "Sentence A: The tree above is growing slower than the tree below.", "match_success": true, "rating": 0 } ] }, "1060403198_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The tree above is growing at the same speed as the tree below.\nCaption B: The tree above is growing slower than the tree below.", "gt-answer": "Caption B: The tree above is growing slower than the tree below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The tree above is growing slower than the tree below.\nOption 2: The tree above is growing faster than the tree below.", "gt-answer": "Option 1: The tree above is growing slower than the tree below.", "video-llm-prediction": "Option 2: The tree above is growing faster than the tree below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The tree above is growing faster than the tree below.\nSentence B: The tree above is growing slower than the tree below.", "gt-answer": "Sentence B: The tree above is growing slower than the tree below.", "video-llm-prediction": "Sentence A: The tree above is growing faster than the tree below.", "match_success": true, "rating": 0 } ] }, "1100058499_concat_0": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The man above is jumping rope faster than the man below.\nCaption B: The man above and the man below are jumping rope at the same speed.", "gt-answer": "Caption B: The man above and the man below are jumping rope at the same speed.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man above and the man below are jumping rope at the same speed.\nOption 2: The man above is jumping rope slower than the man below.", "gt-answer": "Option 1: The man above and the man below are jumping rope at the same speed.", "video-llm-prediction": "Option 1: The man above and the man below are jumping rope at the same speed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man above is jumping rope faster than the man below.\nSentence B: The man above and the man below are jumping rope at the same speed.", "gt-answer": "Sentence B: The man above and the man below are jumping rope at the same speed.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1100058499_concat_1": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The man above is jumping rope faster than the man below.\nCaption B: The man above is jumping rope slower than the man below.", "gt-answer": "Caption B: The man above is jumping rope slower than the man below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man above is jumping rope slower than the man below.\nSentence B: The man above and the man below are jumping rope at the same speed.", "gt-answer": "Sentence A: The man above is jumping rope slower than the man below.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man below is jumping rope slower than the man above.\nOption 2: The man above is jumping rope slower than the man below.", "gt-answer": "Option 2: The man above is jumping rope slower than the man below.", "video-llm-prediction": "Option 2: The man above is jumping rope slower than the man below.", "match_success": true, "rating": 1 } ] }, "1100058499_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The man above is jumping rope at the same speed as the man below.\nCaption B: The man above is jumping rope faster than the man below.", "gt-answer": "Caption B: The man above is jumping rope faster than the man below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man above is jumping rope faster than the man below.\nSentence B: The man above is jumping rope slower than the man below.", "gt-answer": "Sentence A: The man above is jumping rope faster than the man below.", "video-llm-prediction": "Sentence A: The man above is jumping rope faster than the man below.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man below is jumping rope faster than the man above.\nOption 2: The man above is jumping rope faster than the man below.", "gt-answer": "Option 2: The man above is jumping rope faster than the man below.", "video-llm-prediction": "Option 2: The man above is jumping rope faster than the man below.", "match_success": true, "rating": 1 } ] }, "1092813279_concat_0": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman below is doing push ups slower.\nOption 2: The two women are doing push ups at the same speed.", "gt-answer": "Option 2: The two women are doing push ups at the same speed.", "video-llm-prediction": "Option 2: The two women are doing push ups at the same speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman above is doing push ups slower.\nCaption B: The two women are doing push ups at the same speed.", "gt-answer": "Caption B: The two women are doing push ups at the same speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman below is doing push ups faster.\nSentence B: The two women are doing push ups at the same speed.", "gt-answer": "Sentence B: The two women are doing push ups at the same speed.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1092813279_concat_1": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman below is doing push ups slower.\nSentence B: The woman above is doing push ups slower.", "gt-answer": "Sentence B: The woman above is doing push ups slower.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: Two women doing push ups at the same speed.\nCaption B: The woman above is doing push ups slower.", "gt-answer": "Caption B: The woman above is doing push ups slower.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman above is doing push ups faster.\nOption 2: The woman above is doing push ups slower.", "gt-answer": "Option 2: The woman above is doing push ups slower.", "video-llm-prediction": "Option 2: The woman above is doing push ups slower.", "match_success": true, "rating": 1 } ] }, "1092813279_concat_2": { "speed": [ { "question": "Which caption matches the video better?\nCaption A: The woman above is doing push ups slower.\nCaption B: The woman below is doing push ups slower.", "gt-answer": "Caption B: The woman below is doing push ups slower.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman below is doing push ups slower.\nSentence B: Two women doing push ups at the same speed.", "gt-answer": "Sentence A: The woman below is doing push ups slower.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed of the woman above's push ups is the same as the woman below.\nOption 2: The woman below is doing push ups slower.", "gt-answer": "Option 2: The woman below is doing push ups slower.", "video-llm-prediction": "Option 2: The woman below is doing push ups slower.", "match_success": true, "rating": 1 } ] }, "1084518106_concat_0": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The truck above is driving at the same speed as the truck below.\nOption 2: The truck above is driving slower than the truck below.", "gt-answer": "Option 1: The truck above is driving at the same speed as the truck below.", "video-llm-prediction": "Option 2: The truck above is driving slower than the truck below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The truck above is driving faster than the truck below.\nSentence B: The truck above is driving at the same speed as the truck below.", "gt-answer": "Sentence B: The truck above is driving at the same speed as the truck below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The speed of the truck below is slower than the speed of the truck above.\nCaption B: The truck above is driving at the same speed as the truck below.", "gt-answer": "Caption B: The truck above is driving at the same speed as the truck below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1084518106_concat_1": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The truck above is driving slower than the truck below.\nOption 2: The truck above is driving faster than the truck below.", "gt-answer": "Option 2: The truck above is driving faster than the truck below.", "video-llm-prediction": "Option 1: The truck above is driving slower than the truck below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The truck above is driving faster than the truck below.\nSentence B: Both trucks are driving at the same speed.", "gt-answer": "Sentence A: The truck above is driving faster than the truck below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The truck above is driving faster than the truck below.\nCaption B: The truck above is driving slower than the truck below.", "gt-answer": "Caption A: The truck above is driving faster than the truck below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1084518106_concat_2": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The truck above is driving faster than the truck below.\nOption 2: The truck above is driving slower than the truck below.", "gt-answer": "Option 2: The truck above is driving slower than the truck below.", "video-llm-prediction": "Option 1: The truck above is driving faster than the truck below.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The truck above is driving slower than the truck below.\nSentence B: Both trucks are driving at the same speed.", "gt-answer": "Sentence A: The truck above is driving slower than the truck below.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The truck above is driving faster than the truck below.\nCaption B: The truck above is driving slower than the truck below.", "gt-answer": "Caption B: The truck above is driving slower than the truck below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1062609286_concat_0": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The battery charge above is increasing at a slower speed than the battery charge below.\nSentence B: The battery charge above is increasing at the same speed as the battery charge below.", "gt-answer": "Sentence B: The battery charge above is increasing at the same speed as the battery charge below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The battery charge above is increasing at the same speed as the battery charge below.\nOption 2: The battery charge above is increasing at a faster speed than the battery charge below.", "gt-answer": "Option 1: The battery charge above is increasing at the same speed as the battery charge below.", "video-llm-prediction": "Option 2: The battery charge above is increasing at a faster speed than the battery charge below.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The battery charge above is increasing at the same speed as the battery charge below.\nCaption B: The battery charge above is increasing at a slower speed than the battery charge below.", "gt-answer": "Caption A: The battery charge above is increasing at the same speed as the battery charge below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1062609286_concat_1": { "speed": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The battery charge above is increasing at a slower speed than the battery charge below.\nSentence B: The battery charge above is increasing at a faster speed than the battery charge below.", "gt-answer": "Sentence A: The battery charge above is increasing at a slower speed than the battery charge below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The battery charge above is increasing at the same speed as the battery charge below.\nCaption B: The battery charge above is increasing at a slower speed than the battery charge below.", "gt-answer": "Caption B: The battery charge above is increasing at a slower speed than the battery charge below.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The speed at which the battery charge above is increasing is faster than the battery charge below.\nOption 2: The battery charge above is increasing at a slower speed than the battery charge below.", "gt-answer": "Option 2: The battery charge above is increasing at a slower speed than the battery charge below.", "video-llm-prediction": "Option 2: The battery charge above is increasing at a slower speed than the battery charge below.", "match_success": true, "rating": 1 } ] }, "1062609286_concat_2": { "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The battery charge above is increasing at a faster speed than the battery charge below.\nOption 2: The battery charge above is increasing at a slower speed than the battery charge below.", "gt-answer": "Option 1: The battery charge above is increasing at a faster speed than the battery charge below.", "video-llm-prediction": "Option 1: The battery charge above is increasing at a faster speed than the battery charge below.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The battery charge above is increasing at a faster speed than the battery charge below.\nSentence B: The battery charge above is increasing at the same speed as the battery charge below.", "gt-answer": "Sentence A: The battery charge above is increasing at a faster speed than the battery charge below.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The battery charge above is increasing at a slower speed than the battery charge below.\nCaption B: The battery charge above is increasing at a faster speed than the battery charge below.", "gt-answer": "Caption B: The battery charge above is increasing at a faster speed than the battery charge below.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1111601171_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The sphere building is changing from blue to green.\nOption 2: The sphere building is changing from blue to red.", "gt-answer": "Option 1: The sphere building is changing from blue to green.", "video-llm-prediction": "Option 1: The sphere building is changing from blue to green.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The sphere building is changing from green to blue.\nCaption B: The sphere building is changing from blue to green.", "gt-answer": "Caption B: The sphere building is changing from blue to green.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sphere building is staying in the same color.\nSentence B: The sphere building is changing from blue to green.", "gt-answer": "Sentence B: The sphere building is changing from blue to green.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1086105089_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The building is demolishing.\nCaption B: The building is being constructed.", "gt-answer": "Caption A: The building is demolishing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The building is demolishing.\nOption 2: The building is growing wider.", "gt-answer": "Option 1: The building is demolishing.", "video-llm-prediction": "Option 2: The building is growing wider.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The building is staying the same.\nSentence B: The building is demolishing.", "gt-answer": "Sentence B: The building is demolishing.", "video-llm-prediction": "Sentence B: The building is demolishing.", "match_success": true, "rating": 1 } ] }, "1058498242_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D pixels are changing from a cuboid into the shape of a man.\nSentence B: The 3D pixels are changing from the shape of a man into a cuboid.", "gt-answer": "Sentence B: The 3D pixels are changing from the shape of a man into a cuboid.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The 3D pixels are changing from the shape of a man into a cuboid.\nCaption B: The 3D pixels are changing from a cuboid into a the shape of a man.", "gt-answer": "Caption A: The 3D pixels are changing from the shape of a man into a cuboid.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3D pixels are changing from the shape of a man into a cuboid.\nOption 2: The 3D pixels are changing from a sphere into a cuboid.", "gt-answer": "Option 1: The 3D pixels are changing from the shape of a man into a cuboid.", "video-llm-prediction": "Option 1: The 3D pixels are changing from the shape of a man into a cuboid.", "match_success": true, "rating": 1 } ] }, "1082268005_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The planet earth is disassembling and disappearing.\nCaption B: The planet earth is assembling from toy bricks.", "gt-answer": "Caption A: The planet earth is disassembling and disappearing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The planet earth is splitting into two halves.\nOption 2: The planet earth is disassembling and disappearing.", "gt-answer": "Option 2: The planet earth is disassembling and disappearing.", "video-llm-prediction": "Option 2: The planet earth is disassembling and disappearing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The planet earth is disassembling and disappearing.\nSentence B: The planet earth is assembling from toy bricks.", "gt-answer": "Sentence A: The planet earth is disassembling and disappearing.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 } ] }, "1070711428_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The glacier is assembling and rising from the water.\nSentence B: The glacier is breaking and falling in the water.", "gt-answer": "Sentence A: The glacier is assembling and rising from the water.", "video-llm-prediction": "Sentence A: The glacier is assembling and rising from the water.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The glacier is assembling and rising from the water.\nCaption B: The glacier is breaking and falling in the water.", "gt-answer": "Caption A: The glacier is assembling and rising from the water.", "video-llm-prediction": "Caption A: The glacier is assembling and rising from the water.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The glacier is evaporating.\nOption 2: The glacier is assembling and rising from the water.", "gt-answer": "Option 2: The glacier is assembling and rising from the water.", "video-llm-prediction": "Option 2: The glacier is assembling and rising from the water.", "match_success": true, "rating": 1 } ] }, "1057447372_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The sport stadium is turning darker.\nCaption B: The sport stadium is staying the same brightness.", "gt-answer": "Caption A: The sport stadium is turning darker.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sport stadium is becoming brighter.\nOption 2: The sport stadium is turning darker.", "gt-answer": "Option 2: The sport stadium is turning darker.", "video-llm-prediction": "Option 2: The sport stadium is turning darker.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sport stadium is becoming brighter.\nSentence B: The sport stadium is turning darker.", "gt-answer": "Sentence B: The sport stadium is turning darker.", "video-llm-prediction": "Sentence A: The sport stadium is becoming brighter.", "match_success": true, "rating": 0 } ] }, "1053334574_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The black ink is shrinking into the center.\nSentence B: The black ink is staying in the same shape.", "gt-answer": "Sentence A: The black ink is shrinking into the center.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The black ink is shrinking into the center.\nCaption B: The black ink is splitting in half.", "gt-answer": "Caption A: The black ink is shrinking into the center.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The black ink is expanding from the center.\nOption 2: The black ink is shrinking into the center.", "gt-answer": "Option 2: The black ink is shrinking into the center.", "video-llm-prediction": "Option 1: The black ink is expanding from the center.", "match_success": true, "rating": 0 } ] }, "1016172301_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The 3D house model is being demolished.\nCaption B: The 3D house model is being constructed.", "gt-answer": "Caption A: The 3D house model is being demolished.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3D house model is being demolished.\nOption 2: The 3D house model is being constructed.", "gt-answer": "Option 1: The 3D house model is being demolished.", "video-llm-prediction": "Option 2: The 3D house model is being constructed.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D house model is being repaired.\nSentence B: The 3D house model is being demolished.", "gt-answer": "Sentence B: The 3D house model is being demolished.", "video-llm-prediction": "Sentence A: The 3D house model is being repaired.", "match_success": true, "rating": 0 } ] }, "1084736389_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The face is aging.\nCaption B: The face is morphing from a human into a chimpanzee.", "gt-answer": "Caption B: The face is morphing from a human into a chimpanzee.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The face is morphing from a chimpanzee into a human.\nOption 2: The face is morphing from a human into a chimpanzee.", "gt-answer": "Option 2: The face is morphing from a human into a chimpanzee.", "video-llm-prediction": "Option 1: The face is morphing from a chimpanzee into a human.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The face is morphing from a human into a chimpanzee.\nSentence B: The face is morphing from a chimpanzee into a human.", "gt-answer": "Sentence A: The face is morphing from a human into a chimpanzee.", "video-llm-prediction": "Sentence A: The face is morphing from a human into a chimpanzee.", "match_success": true, "rating": 1 } ] }, "1054494542_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The background is changing from pink to green.\nSentence B: The background is changing from blue to pink.", "gt-answer": "Sentence B: The background is changing from blue to pink.", "video-llm-prediction": "Sentence B: The background is changing from blue to pink.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The background is changing from blue to pink.\nOption 2: The background is changing from green to pink.", "gt-answer": "Option 1: The background is changing from blue to pink.", "video-llm-prediction": "Option 1: The background is changing from blue to pink.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The background is changing from blue to pink.\nCaption B: The background is changing from pink to blue.", "gt-answer": "Caption A: The background is changing from blue to pink.", "video-llm-prediction": "Caption B: The background is changing from pink to blue.", "match_success": true, "rating": 0 } ] }, "1055194940_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The insect is transforming from butterfly into pupa.\nSentence B: The insect is transforming from pupa into butterfly.", "gt-answer": "Sentence A: The insect is transforming from butterfly into pupa.", "video-llm-prediction": "Sentence A: The insect is transforming from butterfly into pupa.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The insect is transforming from butterfly into pupa.\nOption 2: The insect is transforming from pupa into butterfly.", "gt-answer": "Option 1: The insect is transforming from butterfly into pupa.", "video-llm-prediction": "Option 2: The insect is transforming from pupa into butterfly.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The insect is transforming from butterfly into pupa.\nCaption B: The insect is transforming from pupa into butterfly.", "gt-answer": "Caption A: The insect is transforming from butterfly into pupa.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1079384099_reverse": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The 3D pixel is transforming from the shape of a white square into a flower.\nCaption B: The 3D pixel is transforming from the shape of a flower into a white square.", "gt-answer": "Caption B: The 3D pixel is transforming from the shape of a flower into a white square.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D pixel is transforming from a white square into the shape of a flower.\nSentence B: The 3D pixel is transforming from the shape of a flower into a white square.", "gt-answer": "Sentence B: The 3D pixel is transforming from the shape of a flower into a white square.", "video-llm-prediction": "Sentence A: The 3D pixel is transforming from a white square into the shape of a flower.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The final shape of the 3D pixel is a star.\nOption 2: The 3D pixel is transforming from the shape of a flower into a white square.", "gt-answer": "Option 2: The 3D pixel is transforming from the shape of a flower into a white square.", "video-llm-prediction": "Option 1: The final shape of the 3D pixel is a star.", "match_success": true, "rating": 0 } ] }, "1099811331_reverse": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The 3d heart is gradually disappearing.\nOption 2: The 3d heart is gradually appearing.", "gt-answer": "Option 1: The 3d heart is gradually disappearing.", "video-llm-prediction": "Option 2: The 3d heart is gradually appearing.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The 3d heart is gradually disappearing.\nCaption B: The size of the 3d heart is growing.", "gt-answer": "Caption A: The 3d heart is gradually disappearing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3d heart is reducing in size.\nSentence B: The 3d heart is gradually disappearing.", "gt-answer": "Sentence B: The 3d heart is gradually disappearing.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1093340469_reverse": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The room is staying the same brightness.\nSentence B: The room is turning brighter.", "gt-answer": "Sentence B: The room is turning brighter.", "video-llm-prediction": "Sentence A: The room is staying the same brightness.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The room is turning brighter.\nCaption B: The room is turning darker.", "gt-answer": "Caption A: The room is turning brighter.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The word that best describes the change in the room is darkening.\nOption 2: The room is turning brighter.", "gt-answer": "Option 2: The room is turning brighter.", "video-llm-prediction": "Option 1: The word that best describes the change in the room is darkening.", "match_success": true, "rating": 0 } ] }, "1111601171": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The sphere building is changing from green to blue.\nOption 2: The sphere building is changing from blue to green.", "gt-answer": "Option 1: The sphere building is changing from green to blue.", "video-llm-prediction": "Option 1: The sphere building is changing from green to blue.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The sphere building is changing from green to blue.\nSentence B: The sphere building is changing from blue to red.", "gt-answer": "Sentence A: The sphere building is changing from green to blue.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The sphere building is staying in the same color.\nCaption B: The sphere building is changing from green to blue.", "gt-answer": "Caption B: The sphere building is changing from green to blue.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1086105089": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The building is being constructed.\nSentence B: The building is demolishing.", "gt-answer": "Sentence A: The building is being constructed.", "video-llm-prediction": "Sentence A: The building is being constructed.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The building is being constructed.\nOption 2: The building is growing wider.", "gt-answer": "Option 1: The building is being constructed.", "video-llm-prediction": "Option 1: The building is being constructed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The building is being deconstructed.\nCaption B: The building is being constructed.", "gt-answer": "Caption B: The building is being constructed.", "video-llm-prediction": "Caption B: The building is being constructed.", "match_success": true, "rating": 1 } ] }, "1058498242": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The 3D pixels are changing from a cuboid into the shape of a man.\nCaption B: The 3D pixels are changing from the shape of a man into a cuboid.", "gt-answer": "Caption A: The 3D pixels are changing from a cuboid into the shape of a man.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3D pixels are changing from a cuboid into the shape of a man.\nOption 2: The 3D pixels are changing from the shape of a man into a cuboid.", "gt-answer": "Option 1: The 3D pixels are changing from a cuboid into the shape of a man.", "video-llm-prediction": "Option 1: The 3D pixels are changing from a cuboid into the shape of a man.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D pixels are changing from a cuboid into the shape of a man.\nSentence B: The 3D pixels are changing from the shape of a man into a cuboid.", "gt-answer": "Sentence A: The 3D pixels are changing from a cuboid into the shape of a man.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1082268005": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The planet earth is assembling from toy bricks.\nOption 2: The planet earth is disassembling and disappearing.", "gt-answer": "Option 1: The planet earth is assembling from toy bricks.", "video-llm-prediction": "Option 1: The planet earth is assembling from toy bricks.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The planet earth is splitting into two halves.\nSentence B: The planet earth is assembling from toy bricks.", "gt-answer": "Sentence B: The planet earth is assembling from toy bricks.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The planet earth is disassembling and disappearing.\nCaption B: The planet earth is assembling from toy bricks.", "gt-answer": "Caption B: The planet earth is assembling from toy bricks.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1070711428": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The glacier is assembling and rising from water.\nOption 2: The glacier is breaking and falling in water.", "gt-answer": "Option 2: The glacier is breaking and falling in water.", "video-llm-prediction": "Option 2: The glacier is breaking and falling in water.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The glacier is assembling and rising from water.\nCaption B: The glacier is breaking and falling in water.", "gt-answer": "Caption B: The glacier is breaking and falling in water.", "video-llm-prediction": "Caption A: The glacier is assembling and rising from water.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The glacier is assembling and rising from water.\nSentence B: The glacier is breaking and falling in water.", "gt-answer": "Sentence B: The glacier is breaking and falling in water.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1057447372": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The sport stadium is turning darker.\nOption 2: The sport stadium is turning brighter.", "gt-answer": "Option 2: The sport stadium is turning brighter.", "video-llm-prediction": "Option 2: The sport stadium is turning brighter.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The brightness of the sport stadium is staying the same.\nSentence B: The sport stadium is turning brighter.", "gt-answer": "Sentence B: The sport stadium is turning brighter.", "video-llm-prediction": "Sentence A: The brightness of the sport stadium is staying the same.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The sport stadium is turning darker.\nCaption B: The sport stadium is turning brighter.", "gt-answer": "Caption B: The sport stadium is turning brighter.", "video-llm-prediction": "Caption B: The sport stadium is turning brighter.", "match_success": true, "rating": 1 } ] }, "1053334574": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The black ink is staying in the same shape.\nSentence B: The black ink is expanding from the center.", "gt-answer": "Sentence B: The black ink is expanding from the center.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The black ink is splitting in half.\nCaption B: The black ink is expanding from the center.", "gt-answer": "Caption B: The black ink is expanding from the center.", "video-llm-prediction": "Caption B: The black ink is expanding from the center.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The black ink is expanding from the center.\nOption 2: The black ink is shrinking into the center.", "gt-answer": "Option 1: The black ink is expanding from the center.", "video-llm-prediction": "Option 1: The black ink is expanding from the center.", "match_success": true, "rating": 1 } ] }, "1016172301": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D house model is being deconstructed.\nSentence B: The 3D house model is being constructed.", "gt-answer": "Sentence B: The 3D house model is being constructed.", "video-llm-prediction": "Sentence A: The 3D house model is being deconstructed.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3D house model is being constructed.\nOption 2: The 3D house model is being demolished.", "gt-answer": "Option 1: The 3D house model is being constructed.", "video-llm-prediction": "Option 1: The 3D house model is being constructed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The 3D house model is being repaired.\nCaption B: The 3D house model is being constructed.", "gt-answer": "Caption B: The 3D house model is being constructed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1084736389": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The face is aging.\nCaption B: The face is morphing from a chimpanzee into a human.", "gt-answer": "Caption B: The face is morphing from a chimpanzee into a human.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The face is morphing from a chimpanzee into a human.\nSentence B: The face is morphing from a human into a chimpanzee.", "gt-answer": "Sentence A: The face is morphing from a chimpanzee into a human.", "video-llm-prediction": "Sentence A: The face is morphing from a chimpanzee into a human.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The face is morphing from a human into a chimpanzee.\nOption 2: The face is morphing from a chimpanzee into a human.", "gt-answer": "Option 2: The face is morphing from a chimpanzee into a human.", "video-llm-prediction": "Option 1: The face is morphing from a human into a chimpanzee.", "match_success": true, "rating": 0 } ] }, "1054494542": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The background is changing from pink to green.\nOption 2: The background is changing from pink to blue.", "gt-answer": "Option 2: The background is changing from pink to blue.", "video-llm-prediction": "Option 2: The background is changing from pink to blue.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The background is changing from pink to blue.\nSentence B: The background is changing from green to pink.", "gt-answer": "Sentence A: The background is changing from pink to blue.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The background is changing from pink to blue.\nCaption B: The background is changing from blue to pink.", "gt-answer": "Caption A: The background is changing from pink to blue.", "video-llm-prediction": "Caption B: The background is changing from blue to pink.", "match_success": true, "rating": 0 } ] }, "1055194940": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The insect is transforming from pupa into butterfly.\nSentence B: The insect is remaining as a butterfly.", "gt-answer": "Sentence A: The insect is transforming from pupa into butterfly.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The insect is transforming from pupa into butterfly.\nCaption B: The insect is transforming from butterfly into pupa.", "gt-answer": "Caption A: The insect is transforming from pupa into butterfly.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The insect is transforming from pupa into butterfly.\nOption 2: The insect is transforming from butterfly into pupa.", "gt-answer": "Option 1: The insect is transforming from pupa into butterfly.", "video-llm-prediction": "Option 1: The insect is transforming from pupa into butterfly.", "match_success": true, "rating": 1 } ] }, "1079384099": { "attribute_change": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D pixel is transforming from the shape of a flower into a white square.\nSentence B: The 3D pixel is transforming from a white square into the shape of a flower.", "gt-answer": "Sentence B: The 3D pixel is transforming from a white square into the shape of a flower.", "video-llm-prediction": "Sentence A: The 3D pixel is transforming from the shape of a flower into a white square.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The 3D pixel is transforming from the shape of a heart into a triangle.\nCaption B: The 3D pixel is transforming from a white square into the shape of a flower.", "gt-answer": "Caption B: The 3D pixel is transforming from a white square into the shape of a flower.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3D pixel is transforming from a white square into the shape of a flower.\nOption 2: The 3D pixel is transforming from the shape of a flower into a white square.", "gt-answer": "Option 1: The 3D pixel is transforming from a white square into the shape of a flower.", "video-llm-prediction": "Option 1: The 3D pixel is transforming from a white square into the shape of a flower.", "match_success": true, "rating": 1 } ] }, "1099811331": { "attribute_change": [ { "question": "Which caption matches the video better?\nCaption A: The 3D heart is reducing in size.\nCaption B: The 3D heart is gradually appearing.", "gt-answer": "Caption B: The 3D heart is gradually appearing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The 3D heart is gradually appearing.\nOption 2: The 3D heart is gradually disappearing.", "gt-answer": "Option 1: The 3D heart is gradually appearing.", "video-llm-prediction": "Option 1: The 3D heart is gradually appearing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The 3D heart is gradually appearing.\nSentence B: The 3D heart is growing in size.", "gt-answer": "Sentence A: The 3D heart is gradually appearing.", "video-llm-prediction": "Sentence A: The 3D heart is gradually appearing.", "match_success": true, "rating": 1 } ] }, "1093340469": { "attribute_change": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The room is staying the same brightness.\nOption 2: The room is turning darker.", "gt-answer": "Option 2: The room is turning darker.", "video-llm-prediction": "Option 2: The room is turning darker.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The room is turning brighter.\nSentence B: The room is turning darker.", "gt-answer": "Sentence B: The room is turning darker.", "video-llm-prediction": "Sentence A: The room is turning brighter.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The room is turning darker.\nCaption B: The room is turning brighter.", "gt-answer": "Caption A: The room is turning darker.", "video-llm-prediction": "Caption B: The room is turning brighter.", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The ice cream melts first and then the sun rises.\nCaption B: The sun is rising and the ice cream is melting at the same time.", "gt-answer": "Caption B: The sun is rising and the ice cream is melting at the same time.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The sun is rising and the ice cream is melting at the same time.\nOption 2: The ice cream melts after the sun rises.", "gt-answer": "Option 1: The sun is rising and the ice cream is melting at the same time.", "video-llm-prediction": "Option 1: The sun is rising and the ice cream is melting at the same time.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream melts first before the sun rises.\nSentence B: The sun is rising and the ice cream is melting at the same time.", "gt-answer": "Sentence B: The sun is rising and the ice cream is melting at the same time.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_1": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream melts first and then the sun rises.\nSentence B: The sun rises and the ice cream melts at the same time.", "gt-answer": "Sentence A: The ice cream melts first and then the sun rises.", "video-llm-prediction": "Sentence A: The ice cream melts first and then the sun rises.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The sun rises first and then the ice cream melts.\nCaption B: The ice cream melts first and then the sun rises.", "gt-answer": "Caption B: The ice cream melts first and then the sun rises.", "video-llm-prediction": "Caption B: The ice cream melts first and then the sun rises.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Both events happen simultaneously, the sun rises and the ice cream melts.\nOption 2: The ice cream melts first and then the sun rises.", "gt-answer": "Option 2: The ice cream melts first and then the sun rises.", "video-llm-prediction": "Option 1: Both events happen simultaneously, the sun rises and the ice cream melts.", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_2": { "order": [ { "question": "Which caption matches the video better?\nCaption A: In the video, the sun rises first and then the ice cream melts.\nCaption B: Both events happen simultaneously, the sun rises and the ice cream melts.", "gt-answer": "Caption A: In the video, the sun rises first and then the ice cream melts.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The ice cream melts before the sun rises.\nSentence B: In the video, the sun rises first and then the ice cream melts.", "gt-answer": "Sentence B: In the video, the sun rises first and then the ice cream melts.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Before the sun rose, the ice cream melted.\nOption 2: In the video, the sun rises first and then the ice cream melts.", "gt-answer": "Option 2: In the video, the sun rises first and then the ice cream melts.", "video-llm-prediction": "Option 1: Before the sun rose, the ice cream melted.", "match_success": true, "rating": 0 } ] }, "1024867412_1034049020_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A girl is walking on the street while a dog is simultaneously driving.\nOption 2: A girl is walking on the street, then a dog is driving.", "gt-answer": "Option 1: A girl is walking on the street while a dog is simultaneously driving.", "video-llm-prediction": "Option 1: A girl is walking on the street while a dog is simultaneously driving.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A dog is driving, then a girl is walking on the street.\nCaption B: A girl is walking on the street while a dog is simultaneously driving.", "gt-answer": "Caption B: A girl is walking on the street while a dog is simultaneously driving.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A girl is walking on the street while a dog is simultaneously driving.\nSentence B: A girl is walking on the street, after a dog is driving.", "gt-answer": "Sentence A: A girl is walking on the street while a dog is simultaneously driving.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1024867412_1034049020_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: A girl is walking on the street, then a dog is driving in the video.\nCaption B: In the video, a dog is driving first, followed by a girl walking on the street.", "gt-answer": "Caption B: In the video, a dog is driving first, followed by a girl walking on the street.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Both events, a dog driving and a girl walking on the street, are happening at the same time in the video.\nOption 2: In the video, a dog is driving first, followed by a girl walking on the street.", "gt-answer": "Option 2: In the video, a dog is driving first, followed by a girl walking on the street.", "video-llm-prediction": "Option 1: Both events, a dog driving and a girl walking on the street, are happening at the same time in the video.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A girl is walking on the street while a dog is simultaneously driving in the video.\nSentence B: In the video, a dog is driving first, followed by a girl walking on the street.", "gt-answer": "Sentence B: In the video, a dog is driving first, followed by a girl walking on the street.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1024867412_1034049020_2": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, first a girl is walking on the street, and then a dog is driving.\nSentence B: A dog is driving, and then a girl is walking on the street.", "gt-answer": "Sentence A: In the video, first a girl is walking on the street, and then a dog is driving.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Both events of a girl walking on the street and a dog driving happen at the same time.\nCaption B: In the video, first a girl is walking on the street, and then a dog is driving.", "gt-answer": "Caption B: In the video, first a girl is walking on the street, and then a dog is driving.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A dog is driving, followed by a girl walking on the street.\nOption 2: In the video, first a girl is walking on the street, and then a dog is driving.", "gt-answer": "Option 2: In the video, first a girl is walking on the street, and then a dog is driving.", "video-llm-prediction": "Option 2: In the video, first a girl is walking on the street, and then a dog is driving.", "match_success": true, "rating": 1 } ] }, "1096238125_1098970151_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Two people lifting weights and a cat licking its paw happening simultaneously.\nOption 2: Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "Option 1: Two people lifting weights and a cat licking its paw happening simultaneously.", "video-llm-prediction": "Option 1: Two people lifting weights and a cat licking its paw happening simultaneously.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Two people lifting weights and a cat licking its paw happening simultaneously.\nCaption B: A cat is licking its paw and then two people are lifting weights.", "gt-answer": "Caption A: Two people lifting weights and a cat licking its paw happening simultaneously.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, two people are lifting weights first, then a cat is licking its paw.\nSentence B: Two people lifting weights and a cat licking its paw happening simultaneously.", "gt-answer": "Sentence B: Two people lifting weights and a cat licking its paw happening simultaneously.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1096238125_1098970151_1": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A cat is licking its paw and then two people are lifting weights in the video.\nOption 2: In the video, two people are lifting weights and then a cat is licking its paw.", "gt-answer": "Option 2: In the video, two people are lifting weights and then a cat is licking its paw.", "video-llm-prediction": "Option 2: In the video, two people are lifting weights and then a cat is licking its paw.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A cat is licking its paw before two people are lifting weights in the video.\nSentence B: In the video, two people are lifting weights and then a cat is licking its paw.", "gt-answer": "Sentence B: In the video, two people are lifting weights and then a cat is licking its paw.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: In the video, two people are lifting weights and then a cat is licking its paw.\nCaption B: A cat is licking its paw and then two people are lifting weights in the video.", "gt-answer": "Caption A: In the video, two people are lifting weights and then a cat is licking its paw.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1096238125_1098970151_2": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A cat is seen licking its paw first, followed by two people lifting weights.\nSentence B: Two people are lifting weights before a cat is seen licking its paw.", "gt-answer": "Sentence A: A cat is seen licking its paw first, followed by two people lifting weights.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Both events, two people lifting weights and a cat licking paw, happen at the same time in the video.\nOption 2: A cat is seen licking its paw first, followed by two people lifting weights.", "gt-answer": "Option 2: A cat is seen licking its paw first, followed by two people lifting weights.", "video-llm-prediction": "Option 1: Both events, two people lifting weights and a cat licking paw, happen at the same time in the video.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: Two people are lifting weights first, followed by a cat licking its paw.\nCaption B: A cat is seen licking its paw first, followed by two people lifting weights.", "gt-answer": "Caption B: A cat is seen licking its paw first, followed by two people lifting weights.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1069717165_1041584314_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: First, a woman is showing different expressions; then, a man is showing different expressions.\nCaption B: The woman and man are showing their expressions simultaneously.", "gt-answer": "Caption B: The woman and man are showing their expressions simultaneously.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man presents his expressions first, followed by the woman.\nSentence B: The woman and man are showing their expressions simultaneously.", "gt-answer": "Sentence B: The woman and man are showing their expressions simultaneously.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman presents her expressions first, followed by the man.\nOption 2: The woman and man are showing their expressions simultaneously.", "gt-answer": "Option 2: The woman and man are showing their expressions simultaneously.", "video-llm-prediction": "Option 1: The woman presents her expressions first, followed by the man.", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: First, a woman is showing different expressions; then, a man is showing different expressions.\nCaption B: Both the woman and the man are showing different expressions at the same time.", "gt-answer": "Caption A: First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: First, a woman is showing different expressions; then, a man is showing different expressions.\nSentence B: The man presents his expressions first, followed by the woman.", "gt-answer": "Sentence A: First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: First, a woman is showing different expressions; then, a man is showing different expressions.\nOption 2: In the video, the woman and man are showing their expressions simultaneously.", "gt-answer": "Option 1: First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "Option 1: First, a woman is showing different expressions; then, a man is showing different expressions.", "match_success": true, "rating": 1 } ] }, "1069717165_1041584314_2": { "order": [ { "question": "Which caption matches the video better?\nCaption A: First, a man is showing different expressions; then, a woman is showing different expressions.\nCaption B: Both the woman and the man are showing different expressions at the same time.", "gt-answer": "Caption A: First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman presents his expressions first, followed by the man.\nOption 2: First, a man is showing different expressions; then, a woman is showing different expressions.", "gt-answer": "Option 2: First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "Option 1: The woman presents his expressions first, followed by the man.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman and man are showing their expressions simultaneously.\nSentence B: First, a man is showing different expressions; then, a woman is showing different expressions.", "gt-answer": "Sentence B: First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: Fire ball expanding and earth spinning are happening together.\nCaption B: The fire ball is expanding before the earth spinning.", "gt-answer": "Caption A: Fire ball expanding and earth spinning are happening together.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Fire ball expanding and earth spinning are happening together.\nOption 2: The fire ball is expanding after the earth spinning.", "gt-answer": "Option 1: Fire ball expanding and earth spinning are happening together.", "video-llm-prediction": "Option 1: Fire ball expanding and earth spinning are happening together.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The fire ball is expanding first, followed by the earth spinning.\nSentence B: Fire ball expanding and earth spinning are happening together.", "gt-answer": "Sentence B: Fire ball expanding and earth spinning are happening together.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_1": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Both events, fire ball expanding and earth spinning, happen together.\nSentence B: The earth is spinning before fire ball expanding.", "gt-answer": "Sentence B: The earth is spinning before fire ball expanding.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The earth is spinning before fire ball expanding.\nCaption B: The fire ball is expanding before the earth spinning.", "gt-answer": "Caption A: The earth is spinning before fire ball expanding.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The earth is spinning before fire ball expanding.\nOption 2: The fire ball is expanding before the earth spinning.", "gt-answer": "Option 1: The earth is spinning before fire ball expanding.", "video-llm-prediction": "Option 2: The fire ball is expanding before the earth spinning.", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The fire ball is expanding before the earth spinning.\nOption 2: Both events, fire ball expanding and earth spinning, happen together.", "gt-answer": "Option 1: The fire ball is expanding before the earth spinning.", "video-llm-prediction": "Option 2: Both events, fire ball expanding and earth spinning, happen together.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The fire ball is expanding after the earth spinning.\nCaption B: The fire ball is expanding before the earth spinning.", "gt-answer": "Caption B: The fire ball is expanding before the earth spinning.", "video-llm-prediction": "Caption B: The fire ball is expanding before the earth spinning.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Both events, fire ball expanding and earth spinning, happen together.\nSentence B: The fire ball is expanding before the earth spinning.", "gt-answer": "Sentence B: The fire ball is expanding before the earth spinning.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.\nCaption B: A person is picking up a pineapple first, then a squirrel is foraging in the video.", "gt-answer": "Caption A: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.\nOption 2: A squirrel is foraging first, then a person is picking up a pineapple in the video.", "gt-answer": "Option 1: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.", "video-llm-prediction": "Option 1: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.\nSentence B: The events in the video are happening sequentially, with the person picking up a pineapple before the squirrel starts foraging.", "gt-answer": "Sentence A: In the video, both a person picking up a pineapple and a squirrel foraging are happening concurrently.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1058907236_1021488277_1": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: First, a squirrel is foraging; then, a person is picking up a pineapple.\nSentence B: A person is picking up a pineapple before a squirrel is foraging.", "gt-answer": "Sentence A: First, a squirrel is foraging; then, a person is picking up a pineapple.", "video-llm-prediction": "Sentence A: First, a squirrel is foraging; then, a person is picking up a pineapple.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: First, a squirrel is foraging; then, a person is picking up a pineapple.\nOption 2: Both events are happening simultaneously.", "gt-answer": "Option 1: First, a squirrel is foraging; then, a person is picking up a pineapple.", "video-llm-prediction": "Option 1: First, a squirrel is foraging; then, a person is picking up a pineapple.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: First, a squirrel is foraging; then, a person is picking up a pineapple.\nCaption B: First, a person is picking up a pineapple; then, a squirrel is foraging.", "gt-answer": "Caption A: First, a squirrel is foraging; then, a person is picking up a pineapple.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A person is picking up a pineapple and then a squirrel is foraging.\nOption 2: First, a squirrel is foraging; then, a person is picking up a pineapple.", "gt-answer": "Option 1: A person is picking up a pineapple and then a squirrel is foraging.", "video-llm-prediction": "Option 2: First, a squirrel is foraging; then, a person is picking up a pineapple.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is picking up a pineapple and then a squirrel is foraging.\nSentence B: First, a squirrel is foraging; then, a person is picking up a pineapple.", "gt-answer": "Sentence A: A person is picking up a pineapple and then a squirrel is foraging.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Both a person picking up a pineapple and a squirrel foraging are happening concurrently.\nCaption B: A person is picking up a pineapple and then a squirrel is foraging.", "gt-answer": "Caption B: A person is picking up a pineapple and then a squirrel is foraging.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1054717541_1047368344_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: In the video, a girl is jumping into water while a person is kneading dough.\nCaption B: A person is kneading dough followed by a girl jumping into water.", "gt-answer": "Caption A: In the video, a girl is jumping into water while a person is kneading dough.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person is kneading dough followed by a girl jumping into water.\nOption 2: In the video, a girl is jumping into water while a person is kneading dough.", "gt-answer": "Option 2: In the video, a girl is jumping into water while a person is kneading dough.", "video-llm-prediction": "Option 2: In the video, a girl is jumping into water while a person is kneading dough.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The person jumps into water after the girl kneads dough.\nSentence B: In the video, a girl is jumping into water while a person is kneading dough.", "gt-answer": "Sentence B: In the video, a girl is jumping into water while a person is kneading dough.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1054717541_1047368344_1": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a person is kneading dough followed by a girl jumping into water.\nOption 2: A girl jumping into water while a person kneading dough.", "gt-answer": "Option 1: In the video, a person is kneading dough followed by a girl jumping into water.", "video-llm-prediction": "Option 1: In the video, a person is kneading dough followed by a girl jumping into water.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A girl is jumping into water, followed by a person kneading dough.\nSentence B: In the video, a person is kneading dough followed by a girl jumping into water.", "gt-answer": "Sentence B: In the video, a person is kneading dough followed by a girl jumping into water.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: In the video, a person is kneading dough followed by a girl jumping into water.\nCaption B: A person is kneading dough after a girl jumping into water.", "gt-answer": "Caption A: In the video, a person is kneading dough followed by a girl jumping into water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1054717541_1047368344_2": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is kneading dough followed by a girl jumping into water in the video.\nSentence B: In the video, a girl is jumping into water first followed by a person kneading dough.", "gt-answer": "Sentence B: In the video, a girl is jumping into water first followed by a person kneading dough.", "video-llm-prediction": "Sentence A: A person is kneading dough followed by a girl jumping into water in the video.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a girl is jumping into water first followed by a person kneading dough.\nOption 2: Both events of a girl jumping into water and a person kneading dough occur at the same time.", "gt-answer": "Option 1: In the video, a girl is jumping into water first followed by a person kneading dough.", "video-llm-prediction": "Option 1: In the video, a girl is jumping into water first followed by a person kneading dough.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A girl jumping into water while a person kneading dough is shown in the video.\nCaption B: In the video, a girl is jumping into water first followed by a person kneading dough.", "gt-answer": "Caption B: In the video, a girl is jumping into water first followed by a person kneading dough.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1089201973_1086820415_0": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person kicking a football and a big wave are shown simultaneously.\nSentence B: A person is kicking a football and then a big wave is shown.", "gt-answer": "Sentence A: A person kicking a football and a big wave are shown simultaneously.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A big wave is shown and then a person is kicking a football.\nCaption B: A person kicking a football and a big wave are shown simultaneously.", "gt-answer": "Caption B: A person kicking a football and a big wave are shown simultaneously.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person kicking a football and a big wave are shown simultaneously.\nOption 2: A person is kicking a football, then a big wave is shown.", "gt-answer": "Option 1: A person kicking a football and a big wave are shown simultaneously.", "video-llm-prediction": "Option 2: A person is kicking a football, then a big wave is shown.", "match_success": true, "rating": 0 } ] }, "1089201973_1086820415_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: A person kicking a football and a big wave are shown simultaneously.\nCaption B: The order of events in the video is that a person is kicking football and a big wave is shown.", "gt-answer": "Caption B: The order of events in the video is that a person is kicking football and a big wave is shown.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The order of events in the video is that a person is kicking football and a big wave is shown.\nSentence B: A big wave is shown and then a person is kicking football.", "gt-answer": "Sentence A: The order of events in the video is that a person is kicking football and a big wave is shown.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The order of events in the video is that a person is kicking football and a big wave is shown.\nOption 2: The order of events in the video is that a big wave is shown and a person is kicking football.", "gt-answer": "Option 1: The order of events in the video is that a person is kicking football and a big wave is shown.", "video-llm-prediction": "Option 1: The order of events in the video is that a person is kicking football and a big wave is shown.", "match_success": true, "rating": 1 } ] }, "1089201973_1086820415_2": { "order": [ { "question": "Which caption matches the video better?\nCaption A: 1. A person kicking a football and a big wave are shown simultaneously.\nCaption B: The video begins with a big wave being shown, followed by a person kicking a football.", "gt-answer": "Caption B: The video begins with a big wave being shown, followed by a person kicking a football.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video begins with a big wave being shown, followed by a person kicking a football.\nSentence B: 2. A person is kicking a football before a big wave is shown.", "gt-answer": "Sentence A: The video begins with a big wave being shown, followed by a person kicking a football.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video begins with a big wave being shown, followed by a person kicking a football.\nOption 2: 3. The video begins with a person kicking a football, followed by a big wave being shown.", "gt-answer": "Option 1: The video begins with a big wave being shown, followed by a person kicking a football.", "video-llm-prediction": "Option 1: The video begins with a big wave being shown, followed by a person kicking a football.", "match_success": true, "rating": 1 } ] }, "1080990179_1086820415_0": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: First, a big wave is shown in the video, and then an apple is drying out.\nSentence B: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "gt-answer": "Sentence B: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "video-llm-prediction": "Sentence B: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, both events of an apple drying out and a big wave are shown simultaneously.\nOption 2: The event of an apple drying out occurs after showing a big wave.", "gt-answer": "Option 1: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "video-llm-prediction": "Option 1: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The event of an apple drying out occurs before showing a big wave.\nCaption B: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "gt-answer": "Caption B: In the video, both events of an apple drying out and a big wave are shown simultaneously.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1080990179_1086820415_1": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: An apple is drying out and then a big wave is shown.\nSentence B: A big wave is shown and then an apple is drying out.", "gt-answer": "Sentence A: An apple is drying out and then a big wave is shown.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: At the same time, an apple is drying out and a big wave is shown.\nCaption B: An apple is drying out and then a big wave is shown.", "gt-answer": "Caption B: An apple is drying out and then a big wave is shown.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: An apple is drying out and then a big wave is shown.\nOption 2: An apple is drying out before a big wave is shown.", "gt-answer": "Option 1: An apple is drying out and then a big wave is shown.", "video-llm-prediction": "Option 2: An apple is drying out before a big wave is shown.", "match_success": true, "rating": 0 } ] }, "1080990179_1086820415_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a big wave is shown first and then an apple is drying out.\nOption 2: An apple is drying out and then a big wave is shown.", "gt-answer": "Option 1: In the video, a big wave is shown first and then an apple is drying out.", "video-llm-prediction": "Option 1: In the video, a big wave is shown first and then an apple is drying out.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Both events occur simultaneously, an apple is drying out and a big wave is shown.\nSentence B: In the video, a big wave is shown first and then an apple is drying out.", "gt-answer": "Sentence B: In the video, a big wave is shown first and then an apple is drying out.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: In the video, a big wave is shown first and then an apple is drying out.\nCaption B: In the video, an apple is drying out first and then a big wave is shown.", "gt-answer": "Caption A: In the video, a big wave is shown first and then an apple is drying out.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1067268403_1064645467_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Wind turbines are rotating followed by a man doing exercise.\nOption 2: A man is doing exercise while wind turbines are rotating concurrently.", "gt-answer": "Option 2: A man is doing exercise while wind turbines are rotating concurrently.", "video-llm-prediction": "Option 2: A man is doing exercise while wind turbines are rotating concurrently.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A man is doing exercise while wind turbines are rotating concurrently.\nCaption B: A man doing exercise followed by wind turbines rotating.", "gt-answer": "Caption A: A man is doing exercise while wind turbines are rotating concurrently.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A man doing exercise followed by wind turbines rotating.\nSentence B: A man is doing exercise while wind turbines are rotating concurrently.", "gt-answer": "Sentence B: A man is doing exercise while wind turbines are rotating concurrently.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1067268403_1064645467_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: A man is doing exercise while wind turbines are rotating.\nCaption B: Wind turbines are rotating followed by a man doing exercise.", "gt-answer": "Caption B: Wind turbines are rotating followed by a man doing exercise.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A man is doing exercise before wind turbines rotating.\nSentence B: Wind turbines are rotating followed by a man doing exercise.", "gt-answer": "Sentence B: Wind turbines are rotating followed by a man doing exercise.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Wind turbines are rotating followed by a man doing exercise.\nOption 2: A man is doing exercise followed by wind turbines rotating.", "gt-answer": "Option 1: Wind turbines are rotating followed by a man doing exercise.", "video-llm-prediction": "Option 2: A man is doing exercise followed by wind turbines rotating.", "match_success": true, "rating": 0 } ] }, "1067268403_1064645467_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Wind turbines are rotating followed by a man doing exercise.\nOption 2: The video shows a man doing exercise followed by wind turbines rotating.", "gt-answer": "Option 2: The video shows a man doing exercise followed by wind turbines rotating.", "video-llm-prediction": "Option 1: Wind turbines are rotating followed by a man doing exercise.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video shows a man doing exercise followed by wind turbines rotating.\nSentence B: Wind turbines are rotating followed by a man doing exercise.", "gt-answer": "Sentence A: The video shows a man doing exercise followed by wind turbines rotating.", "video-llm-prediction": "Sentence A: The video shows a man doing exercise followed by wind turbines rotating.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A man is doing exercise concurrently with wind turbines rotating.\nCaption B: The video shows a man doing exercise followed by wind turbines rotating.", "gt-answer": "Caption B: The video shows a man doing exercise followed by wind turbines rotating.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_0": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Planet Earth is assembling from toy bricks and then viruses are dissolving.\nSentence B: Planet earth assembling and viruses dissolving are happening simultaneously.", "gt-answer": "Sentence B: Planet earth assembling and viruses dissolving are happening simultaneously.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: Planet earth assembling and viruses dissolving are happening simultaneously.\nCaption B: Viruses are dissolving and then planet Earth is assembling from toy bricks.", "gt-answer": "Caption A: Planet earth assembling and viruses dissolving are happening simultaneously.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Planet earth assembling and viruses dissolving are happening simultaneously.\nOption 2: Viruses are dissolving and then planet Earth is assembling from toy bricks.", "gt-answer": "Option 1: Planet earth assembling and viruses dissolving are happening simultaneously.", "video-llm-prediction": "Option 1: Planet earth assembling and viruses dissolving are happening simultaneously.", "match_success": true, "rating": 1 } ] }, "1082268005_1063373449_1": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Viruses are dissolving and then planet earth is assembling from toy bricks.\nOption 2: The video shows planet earth assembling from toy bricks and then viruses dissolving.", "gt-answer": "Option 2: The video shows planet earth assembling from toy bricks and then viruses dissolving.", "video-llm-prediction": "Option 2: The video shows planet earth assembling from toy bricks and then viruses dissolving.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video shows planet earth assembling from toy bricks and then viruses dissolving.\nSentence B: Planet earth assembling and viruses dissolving are happening simultaneously.", "gt-answer": "Sentence A: The video shows planet earth assembling from toy bricks and then viruses dissolving.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video shows planet earth assembling from toy bricks and then viruses dissolving.\nCaption B: Planet earth is assembling from toy bricks after viruses dissolving.", "gt-answer": "Caption A: The video shows planet earth assembling from toy bricks and then viruses dissolving.", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1082268005_1063373449_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.\nOption 2: Planet earth assembling and viruses dissolving are happening simultaneously.", "gt-answer": "Option 1: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.", "video-llm-prediction": "Option 1: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Planet earth is assembling from toy bricks first and then viruses dissolving.\nSentence B: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.", "gt-answer": "Sentence B: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: Planet earth is assembling from toy bricks first and then viruses dissolving.\nCaption B: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.", "gt-answer": "Caption B: In the video, viruses are dissolving first and then planet earth is assembling from toy bricks.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A light bulb is lighting up while the tree is growing up at the same time\nOption 2: A light bulb is lighting up and then the tree is growing up.", "gt-answer": "Option 1: A light bulb is lighting up while the tree is growing up at the same time", "video-llm-prediction": "Option 1: A light bulb is lighting up while the tree is growing up at the same time.", "match_success": false, "chatgpt-response": "Correct", "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A light bulb is lighting up while the tree is growing up at the same time\nSentence B: The tree is growing up and then a light bulb is lighting up.", "gt-answer": "Sentence A: A light bulb is lighting up while the tree is growing up at the same time", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The light bulb lights up after the tree grows.\nCaption B: A light bulb is lighting up while the tree is growing up at the same time", "gt-answer": "Caption B: A light bulb is lighting up while the tree is growing up at the same time", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1060403198_1049965795_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The tree is growing up and then a light bulb is lighting up.\nCaption B: A light bulb is lighting up while the tree is growing up at the same time", "gt-answer": "Caption A: The tree is growing up and then a light bulb is lighting up.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A light bulb is lighting up and then the tree is growing up.\nSentence B: The tree is growing up and then a light bulb is lighting up.", "gt-answer": "Sentence B: The tree is growing up and then a light bulb is lighting up.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The tree is growing up after a light bulb is lighting up.\nOption 2: The tree is growing up and then a light bulb is lighting up.", "gt-answer": "Option 2: The tree is growing up and then a light bulb is lighting up.", "video-llm-prediction": "Option 1: The tree is growing up after a light bulb is lighting up.", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_2": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The video shows a light bulb lighting up first and then the tree growing up.\nSentence B: The tree is growing up and then a light bulb is lighting up.", "gt-answer": "Sentence A: The video shows a light bulb lighting up first and then the tree growing up.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A light bulb is lighting up while the tree is growing up at the same time\nOption 2: The video shows a light bulb lighting up first and then the tree growing up.", "gt-answer": "Option 2: The video shows a light bulb lighting up first and then the tree growing up.", "video-llm-prediction": "Option 2: The video shows a light bulb lighting up first and then the tree growing up.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video shows a light bulb lighting up first and then the tree growing up.\nCaption B: The video shows the tree growing up first and then a light bulb lighting up.", "gt-answer": "Caption A: The video shows a light bulb lighting up first and then the tree growing up.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1091143117_1094219575_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, first a flower is wilting and then an eys is opening.\nOption 2: Both events of an eye opening and a flower wilting happen simultaneously in the video.", "gt-answer": "Option 2: Both events of an eye opening and a flower wilting happen simultaneously in the video.", "video-llm-prediction": "Option 1: In the video, first a flower is wilting and then an eys is opening.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: An eye is opening in the video, followed by a flower wilting.\nCaption B: Both events of an eye opening and a flower wilting happen simultaneously in the video.", "gt-answer": "Caption B: Both events of an eye opening and a flower wilting happen simultaneously in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: An eye is opening in the video, followed by a flower wilting.\nSentence B: Both events of an eye opening and a flower wilting happen simultaneously in the video.", "gt-answer": "Sentence B: Both events of an eye opening and a flower wilting happen simultaneously in the video.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1091143117_1094219575_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: Both events of an eye opening and a flower wilting happen simultaneously.\nCaption B: In the video, an eye is opening first and then a flower is wilting.", "gt-answer": "Caption B: In the video, an eye is opening first and then a flower is wilting.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A flower is wilting first, and then an eye is opening.\nSentence B: In the video, an eye is opening first and then a flower is wilting.", "gt-answer": "Sentence B: In the video, an eye is opening first and then a flower is wilting.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, an eye is opening first and then a flower is wilting.\nOption 2: A flower is wilting first, then an eye is opening.", "gt-answer": "Option 1: In the video, an eye is opening first and then a flower is wilting.", "video-llm-prediction": "Option 2: A flower is wilting first, then an eye is opening.", "match_success": true, "rating": 0 } ] }, "1091143117_1094219575_2": { "order": [ { "question": "Which caption matches the video better?\nCaption A: In the video, a flower is wilting first, and then an eye is opening.\nCaption B: An eye is opening first, then a flower is wilting in the video.", "gt-answer": "Caption A: In the video, a flower is wilting first, and then an eye is opening.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a flower is wilting first, and then an eye is opening.\nOption 2: Both events, a flower wilting and an eye opening, are happening simultaneously in the video.", "gt-answer": "Option 1: In the video, a flower is wilting first, and then an eye is opening.", "video-llm-prediction": "Option 2: In the video, a flower is wilting first, and then an eye is opening.", "match_success": false, "chatgpt-response": "Incorrect", "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, a flower is wilting first, and then an eye is opening.\nSentence B: An eye is opening before a flower wilts in the video.", "gt-answer": "Sentence A: In the video, a flower is wilting first, and then an eye is opening.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1086105089_1085910917_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: First, a building is being constructed; then, a woman is drinking water.\nOption 2: A building is being constructed while at the same time a woman is drinking water.", "gt-answer": "Option 2: A building is being constructed while at the same time a woman is drinking water.", "video-llm-prediction": "Option 2: A building is being constructed while at the same time a woman is drinking water.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A woman is drinking water happens before a building is being constructed.\nCaption B: A building is being constructed while at the same time a woman is drinking water.", "gt-answer": "Caption B: A building is being constructed while at the same time a woman is drinking water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A building is being constructed happens before a woman is drinking water.\nSentence B: A building is being constructed while at the same time a woman is drinking water.", "gt-answer": "Sentence B: A building is being constructed while at the same time a woman is drinking water.", "video-llm-prediction": "Sentence B: A building is being constructed while at the same time a woman is drinking water.", "match_success": true, "rating": 1 } ] }, "1086105089_1085910917_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: First, a building is being constructed; then, a woman is drinking water.\nCaption B: A woman is drinking water before a building is being constructed.", "gt-answer": "Caption A: First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A building is being constructed while at the same time a woman is drinking water.\nOption 2: First, a building is being constructed; then, a woman is drinking water.", "gt-answer": "Option 2: First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "Option 2: First, a building is being constructed; then, a woman is drinking water.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: First, a woman is drinking water; then, a building is being constructed.\nSentence B: First, a building is being constructed; then, a woman is drinking water.", "gt-answer": "Sentence B: First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1086105089_1085910917_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: First, a woman is drinking water; then, a building is being constructed.\nOption 2: A building is being constructed while at the same time a woman is drinking water.", "gt-answer": "Option 1: First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "Option 1: First, a woman is drinking water; then, a building is being constructed.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A building is being constructed happens before a woman is drinking water.\nSentence B: First, a woman is drinking water; then, a building is being constructed.", "gt-answer": "Sentence B: First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "Sentence B: First, a woman is drinking water; then, a building is being constructed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: First, a building is being constructed; then, a woman is drinking water.\nCaption B: First, a woman is drinking water; then, a building is being constructed.", "gt-answer": "Caption B: First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1034736653_1043054206_0": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: Women are running first, then cars are racing.\nOption 2: Woman running and car racing happen simultaneously.", "gt-answer": "Option 2: Woman running and car racing happen simultaneously.", "video-llm-prediction": "Option 2: Woman running and car racing happen simultaneously.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Cars are racing first, then women are running.\nCaption B: Woman running and car racing happen simultaneously.", "gt-answer": "Caption B: Woman running and car racing happen simultaneously.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Women are running first, then cars are racing.\nSentence B: Woman running and car racing happen simultaneously.", "gt-answer": "Sentence B: Woman running and car racing happen simultaneously.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1034736653_1043054206_1": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video shows women running first, followed by cars racing.\nOption 2: Woman running and car racing happen simultaneously.", "gt-answer": "Option 1: The video shows women running first, followed by cars racing.", "video-llm-prediction": "Option 2: The video shows woman running and car racing happening simultaneously.", "match_success": false, "chatgpt-response": "Incorrect", "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The cars are racing first, followed by women running.\nCaption B: The video shows women running first, followed by cars racing.", "gt-answer": "Caption B: The video shows women running first, followed by cars racing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The cars are racing first, followed by women running.\nSentence B: The video shows women running first, followed by cars racing.", "gt-answer": "Sentence B: The video shows women running first, followed by cars racing.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 } ] }, "1034736653_1043054206_2": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The cars are racing first, followed by women running.\nCaption B: Woman running and car racing happen simultaneously.", "gt-answer": "Caption A: The cars are racing first, followed by women running.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The cars are racing first, followed by women running.\nSentence B: The video shows women running first, followed by cars racing.", "gt-answer": "Sentence A: The cars are racing first, followed by women running.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Cars are racing after the women have started running.\nOption 2: The cars are racing first, followed by women running.", "gt-answer": "Option 2: The cars are racing first, followed by women running.", "video-llm-prediction": "Option 2: The cars are racing first, followed by women running.", "match_success": true, "rating": 1 } ] }, "1086423566_1094782389_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.\nCaption B: A dog is giving a high five to a woman, and then foods are added into a bowl.", "gt-answer": "Caption A: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.\nOption 2: A dog is giving a high five to a woman, and then foods are added into a bowl.", "gt-answer": "Option 1: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.", "video-llm-prediction": "Option 1: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.\nSentence B: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "gt-answer": "Sentence A: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1086423566_1094782389_1": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Foods are added into a bowl, and then a dog is giving a high five to a woman.\nSentence B: A dog is giving a high five to a woman, and then foods are added into a bowl.", "gt-answer": "Sentence A: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman.\nOption 2: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "gt-answer": "Option 2: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "video-llm-prediction": "Option 2: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A dog is giving a high five to a woman, and then foods are added into a bowl.\nCaption B: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "gt-answer": "Caption B: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_2": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.\nOption 2: Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman.", "gt-answer": "Option 1: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.", "video-llm-prediction": "Option 1: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Foods are added into a bowl, while at the same time a dog is giving a high five to a woman.\nCaption B: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.", "gt-answer": "Caption B: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.\nSentence B: Foods are added into a bowl, and then a dog is giving a high five to a woman.", "gt-answer": "Sentence A: In the video, a dog is giving a high five to a woman, and then foods are added into a bowl.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1053758117_1055413730_0": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The digital brain and the earth are spinning at the same time.\nSentence B: First, the digital brain is spinning and then the earth is spinning.", "gt-answer": "Sentence A: The digital brain and the earth are spinning at the same time.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The digital brain and the earth are spinning at the same time.\nOption 2: The earth is spinning first, followed by the digital brain spinning.", "gt-answer": "Option 1: The digital brain and the earth are spinning at the same time.", "video-llm-prediction": "Option 2: The earth is spinning first, followed by the digital brain spinning.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The video shows the earth spinning.\nCaption B: The digital brain and the earth are spinning at the same time.", "gt-answer": "Caption B: The digital brain and the earth are spinning at the same time.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1053758117_1055413730_1": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: First, the digital brain is spinning and then the earth is spinning.\nOption 2: The digital brain and the earth are spinning at the same time.", "gt-answer": "Option 1: First, the digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "Option 2: The digital brain and the earth are spinning at the same time.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, the earth is spinning before the digital brain starts spinning.\nSentence B: First, the digital brain is spinning and then the earth is spinning.", "gt-answer": "Sentence B: First, the digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: First, the digital brain is spinning and then the earth is spinning.\nCaption B: In the video, the earth is spinning before the digital brain starts spinning.", "gt-answer": "Caption A: First, the digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1053758117_1055413730_2": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The digital brain and the earth are spinning simultaneously.\nSentence B: In the video, the earth is spinning before the digital brain starts spinning.", "gt-answer": "Sentence B: In the video, the earth is spinning before the digital brain starts spinning.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, the earth is spinning before the digital brain starts spinning.\nOption 2: First, the digital brain is spinning and then the earth is spinning.", "gt-answer": "Option 1: In the video, the earth is spinning before the digital brain starts spinning.", "video-llm-prediction": "Option 1: In the video, the earth is spinning before the digital brain starts spinning.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A video showing the digital brain spinning and then the earth spinning.\nCaption B: In the video, the earth is spinning before the digital brain starts spinning.", "gt-answer": "Caption B: In the video, the earth is spinning before the digital brain starts spinning.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1076877854_1073914229_0": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Robotic arms are working, then trains are driving.\nSentence B: Trains are driving and robotic arms are working at the same time.", "gt-answer": "Sentence B: Trains are driving and robotic arms are working at the same time.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Trains are driving and robotic arms are working at the same time.\nOption 2: The robotic arms are working first, then the trains are driving.", "gt-answer": "Option 1: Trains are driving and robotic arms are working at the same time.", "video-llm-prediction": "Option 2: The robotic arms are working first, then the trains are driving.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: Trains are driving and robotic arms are working at the same time.\nCaption B: Trains are driving, then robotic arms are working.", "gt-answer": "Caption A: Trains are driving and robotic arms are working at the same time.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1076877854_1073914229_1": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The trains are driving first, and then robotic arms are working.\nSentence B: The robotic arms are working first, then the trains are driving.", "gt-answer": "Sentence B: The robotic arms are working first, then the trains are driving.", "video-llm-prediction": "Sentence B: The robotic arms are working first, then the trains are driving.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Both the robotic arms and trains are shown at the same time.\nOption 2: The robotic arms are working first, then the trains are driving.", "gt-answer": "Option 2: The robotic arms are working first, then the trains are driving.", "video-llm-prediction": "Option 2: The robotic arms are working first, then the trains are driving.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The robotic arms are working first, then the trains are driving.\nCaption B: The trains are driving first, and then robotic arms are working.", "gt-answer": "Caption A: The robotic arms are working first, then the trains are driving.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1076877854_1073914229_2": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: In the video, robotic arms are working and trains are driving at the same time.\nSentence B: First, trains are driving, then robotic arms are working.", "gt-answer": "Sentence B: First, trains are driving, then robotic arms are working.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: First, trains are driving, then robotic arms are working.\nOption 2: The robotic arms are working first, then the trains are driving.", "gt-answer": "Option 1: First, trains are driving, then robotic arms are working.", "video-llm-prediction": "Option 2: The robotic arms are working first, then the trains are driving.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The robotic arms are working first, then the trains are driving.\nCaption B: First, trains are driving, then robotic arms are working.", "gt-answer": "Caption B: First, trains are driving, then robotic arms are working.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1067268406_1067427023_0": { "order": [ { "question": "Which caption matches the video better?\nCaption A: Snow particles are melting, then a white car is driving.\nCaption B: In the video, a white car is driving while snow particles are melting simultaneously.", "gt-answer": "Caption B: In the video, a white car is driving while snow particles are melting simultaneously.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A white car is driving first, then snow particles are melting.\nSentence B: In the video, a white car is driving while snow particles are melting simultaneously.", "gt-answer": "Sentence B: In the video, a white car is driving while snow particles are melting simultaneously.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: In the video, a white car is driving while snow particles are melting simultaneously.\nOption 2: A white car is driving first, then snow particles are melting.", "gt-answer": "Option 1: In the video, a white car is driving while snow particles are melting simultaneously.", "video-llm-prediction": "Option 1: In the video, a white car is driving while snow particles are melting simultaneously.", "match_success": true, "rating": 1 } ] }, "1067268406_1067427023_1": { "order": [ { "question": "Which caption matches the video better?\nCaption A: A white car is driving first, then snow particles are melting.\nCaption B: Snow particles are melting, then a white car is driving.", "gt-answer": "Caption A: A white car is driving first, then snow particles are melting.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A white car is driving while snow particles are melting simultaneously.\nSentence B: A white car is driving first, then snow particles are melting.", "gt-answer": "Sentence B: A white car is driving first, then snow particles are melting.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Snow particles are melting, before a white car is driving.\nOption 2: A white car is driving first, then snow particles are melting.", "gt-answer": "Option 2: A white car is driving first, then snow particles are melting.", "video-llm-prediction": "Option 2: A white car is driving first, then snow particles are melting.", "match_success": true, "rating": 1 } ] }, "1067268406_1067427023_2": { "order": [ { "question": "Which caption matches the video better?\nCaption A: Snow particles are melting, then a white car is driving.\nCaption B: A white car is driving while snow particles are melting simultaneously.", "gt-answer": "Caption A: Snow particles are melting, then a white car is driving.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Snow particles are melting, then a white car is driving.\nOption 2: A white car is driving, then snow particles are melting.", "gt-answer": "Option 1: Snow particles are melting, then a white car is driving.", "video-llm-prediction": "Option 1: Snow particles are melting, then a white car is driving.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: Snow particles are melting, then a white car is driving.\nSentence B: A white car is driving first, then snow particles are melting.", "gt-answer": "Sentence A: Snow particles are melting, then a white car is driving.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1086286649": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The armored vehicles are driving.\nSentence B: The armored vehicles are loading people.", "gt-answer": "Sentence A: The armored vehicles are driving.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The armored vehicles are parked.\nCaption B: The armored vehicles are driving.", "gt-answer": "Caption B: The armored vehicles are driving.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The armored vehicles are driving.\nOption 2: The armored vehicles are firing.", "gt-answer": "Option 1: The armored vehicles are driving.", "video-llm-prediction": "Option 1: The armored vehicles are driving.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The armored vehicles are moving from right to left.\nSentence B: The armored vehicles are moving from left to right.", "gt-answer": "Sentence A: The armored vehicles are moving from right to left.", "video-llm-prediction": "Sentence A: The armored vehicles are moving from right to left.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The armored vehicles are approaching from the upper side of the screen.\nOption 2: The armored vehicles are moving from right to left.", "gt-answer": "Option 2: The armored vehicles are moving from right to left.", "video-llm-prediction": "Option 2: The armored vehicles are moving from right to left.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The armored vehicles are approaching from left to right.\nCaption B: The armored vehicles are moving from right to left.", "gt-answer": "Caption B: The armored vehicles are moving from right to left.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Which caption matches the video better?\nCaption A: The armored vehicles are stationary.\nCaption B: The armored vehicles are moving slowly.", "gt-answer": "Caption B: The armored vehicles are moving slowly.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The armored vehicles are moving rapidly.\nOption 2: The armored vehicles are moving slowly.", "gt-answer": "Option 2: The armored vehicles are moving slowly.", "video-llm-prediction": "Option 1: The armored vehicles are moving rapidly.", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The pace of the armored vehicles is fast.\nSentence B: The armored vehicles are moving slowly.", "gt-answer": "Sentence B: The armored vehicles are moving slowly.", "video-llm-prediction": "Sentence A: The pace of the armored vehicles is fast.", "match_success": true, "rating": 0 } ] }, "1093041749": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The dragon is breathing fire.\nSentence B: A video showing a dragon flying.", "gt-answer": "Sentence A: The dragon is breathing fire.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The dragon is breathing fire.\nOption 2: The dragon is swimming.", "gt-answer": "Option 1: The dragon is breathing fire.", "video-llm-prediction": "Option 1: The dragon is breathing fire.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The dragon is breathing fire.\nCaption B: The dragon is eating food.", "gt-answer": "Caption A: The dragon is breathing fire.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The dragon is flying to the sky and then breathing fire.\nOption 2: The dragon is landing from the sky and then breathing fire.", "gt-answer": "Option 2: The dragon is landing from the sky and then breathing fire.", "video-llm-prediction": "Option 1: The dragon is flying to the sky and then breathing fire.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The dragon is breathing fire and then flying to the sky.\nCaption B: The dragon is landing from the sky and then breathing fire.", "gt-answer": "Caption B: The dragon is landing from the sky and then breathing fire.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The dragon is landing from the sky and then breathing fire.\nSentence B: The dragon is breathing fire and then landing from the sky.", "gt-answer": "Sentence A: The dragon is landing from the sky and then breathing fire.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1076180768": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The knight is putting on armor.\nOption 2: The knight is drawing a sword from the sheath.", "gt-answer": "Option 2: The knight is drawing a sword from the sheath.", "video-llm-prediction": "Option 2: The knight is drawing a sword from the sheath.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The knight is drawing a sword from the sheath.\nSentence B: A video showing the knight wielding a spear.", "gt-answer": "Sentence A: The knight is drawing a sword from the sheath.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The knight is drawing a sword from the sheath.\nCaption B: The knight is shooting an arrow.", "gt-answer": "Caption A: The knight is drawing a sword from the sheath.", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "3406661033": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The man is propelling himself forward in a wheelchair.\nCaption B: The man is swimming.", "gt-answer": "Caption A: The man is propelling himself forward in a wheelchair.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is propelling himself forward in a wheelchair.\nOption 2: A video showing the man walking.", "gt-answer": "Option 1: The man is propelling himself forward in a wheelchair.", "video-llm-prediction": "Option 1: The man is propelling himself forward in a wheelchair.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is jumping.\nSentence B: The man is propelling himself forward in a wheelchair.", "gt-answer": "Sentence B: The man is propelling himself forward in a wheelchair.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man stood up from the wheelchair and then handed the document to colleagues.\nOption 2: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "gt-answer": "Option 2: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "video-llm-prediction": "Option 2: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man handed the document to colleagues and then propelled himself forward in the wheelchair.\nCaption B: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "gt-answer": "Caption B: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man handed the document to colleagues and then propelled himself forward in the wheelchair.\nSentence B: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "gt-answer": "Sentence B: The man first propelled himself forward in the wheelchair and then handed the document to colleagues.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "3406618583": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The woman is performing freestyle dance.\nCaption B: The woman is performing hip-hop.", "gt-answer": "Caption A: The woman is performing freestyle dance.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is performing freestyle dance.\nSentence B: The woman is doing ballet.", "gt-answer": "Sentence A: The woman is performing freestyle dance.", "video-llm-prediction": "Sentence A: The woman is performing freestyle dance.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A video showing the woman engaged in jazz dance.\nOption 2: The woman is performing freestyle dance.", "gt-answer": "Option 2: The woman is performing freestyle dance.", "video-llm-prediction": "Option 1: A video showing the woman engaged in jazz dance.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The camera is panning up and down around the girl.\nOption 2: The camera is panning left and right around the girl.", "gt-answer": "Option 1: The camera is panning up and down around the girl.", "video-llm-prediction": "Option 1: The camera is panning up and down around the girl.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The camera is rotating clockwise around the girl.\nCaption B: The camera is panning up and down around the girl.", "gt-answer": "Caption B: The camera is panning up and down around the girl.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The camera is zooming in and out around the girl.\nSentence B: The camera is panning up and down around the girl.", "gt-answer": "Sentence B: The camera is panning up and down around the girl.", "video-llm-prediction": "Sentence A: The camera is zooming in and out around the girl.", "match_success": true, "rating": 0 } ] }, "3405120819": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The chef is cutting dough.\nCaption B: The chef is shaping dough.", "gt-answer": "Caption B: The chef is shaping dough.", "video-llm-prediction": "Caption B: The chef is shaping dough.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The chef is shaping dough.\nOption 2: The chef is placing dough in a dish.", "gt-answer": "Option 1: The chef is shaping dough.", "video-llm-prediction": "Option 1: The chef is shaping dough.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The chef is shaping dough.\nSentence B: The chef is mixing dough with water.", "gt-answer": "Sentence A: The chef is shaping dough.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The chef is smiling at the camera and then shaping dough.\nSentence B: The chef is shaping dough and then smiling at the camera.", "gt-answer": "Sentence B: The chef is shaping dough and then smiling at the camera.", "video-llm-prediction": "Sentence A: The chef is smiling at the camera and then shaping dough.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The chef is smiling at the camera and then shaping dough.\nOption 2: The chef is shaping dough and then smiling at the camera.", "gt-answer": "Option 2: The chef is shaping dough and then smiling at the camera.", "video-llm-prediction": "Option 2: The chef is shaping dough and then smiling at the camera.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The chef is smiling at the camera and then shaping dough.\nCaption B: The chef is shaping dough and then smiling at the camera.", "gt-answer": "Caption B: The chef is shaping dough and then smiling at the camera.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "3405088753": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is buying bread in the video.\nSentence B: The woman is cooking soup.", "gt-answer": "Sentence A: The woman is buying bread in the video.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is eating an apple.\nCaption B: The woman is buying bread in the video.", "gt-answer": "Caption B: The woman is buying bread in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is buying bread in the video.\nOption 2: The woman is sleeping.", "gt-answer": "Option 1: The woman is buying bread in the video.", "video-llm-prediction": "Option 1: The woman is buying bread in the video.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The salesman is saying something to a woman and then packing up the bread for her.\nOption 2: The salesman is packing up the bread for the woman and then saying something to her.", "gt-answer": "Option 2: The salesman is packing up the bread for the woman and then saying something to her.", "video-llm-prediction": "Option 1: The salesman is saying something to a woman and then packing up the bread for her.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The salesman is saying something to a woman and then packing up the bread for her.\nCaption B: The salesman is packing up the bread for the woman and then saying something to her.", "gt-answer": "Caption B: The salesman is packing up the bread for the woman and then saying something to her.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The salesman is packing up the bread for the woman and then saying something to her.\nSentence B: The salesman is saying something to a woman and then packing up the bread for her.", "gt-answer": "Sentence A: The salesman is packing up the bread for the woman and then saying something to her.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "3401191309": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: An athletic man is taking off a prosthetic running blade.\nSentence B: The athletic man is putting on a prosthetic running blade.", "gt-answer": "Sentence A: An athletic man is taking off a prosthetic running blade.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: An athletic man is taking off a prosthetic running blade.\nCaption B: The athletic man is repairing a prosthetic running blade.", "gt-answer": "Caption A: An athletic man is taking off a prosthetic running blade.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: An athletic man is taking off a prosthetic running blade.\nOption 2: A video showing an athletic man running with a prosthetic blade.", "gt-answer": "Option 1: An athletic man is taking off a prosthetic running blade.", "video-llm-prediction": "Option 1: An athletic man is taking off a prosthetic running blade.", "match_success": true, "rating": 1 } ] }, "21218935": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is exercising.\nOption 2: The woman is cooking.", "gt-answer": "Option 1: The woman is exercising.", "video-llm-prediction": "Option 1: The woman is exercising.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A woman is sleeping.\nCaption B: The woman is exercising.", "gt-answer": "Caption B: The woman is exercising.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is exercising.\nSentence B: The woman is reading.", "gt-answer": "Sentence A: The woman is exercising.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ], "order": [ { "question": "Which caption matches the video better?\nCaption A: The woman first smiles at the camera and then does push ups.\nCaption B: The woman first does push ups and then smiles at the camera.", "gt-answer": "Caption B: The woman first does push ups and then smiles at the camera.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman first smiles at the camera and then does push ups.\nSentence B: The woman first does push ups and then smiles at the camera.", "gt-answer": "Sentence B: The woman first does push ups and then smiles at the camera.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman first smiles at the camera and then does push ups.\nOption 2: The woman first does push ups and then smiles at the camera.", "gt-answer": "Option 2: The woman first does push ups and then smiles at the camera.", "video-llm-prediction": "Option 1: The woman first smiles at the camera and then does push ups.", "match_success": true, "rating": 0 } ] }, "5395244": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is walking across the pebble creek.\nOption 2: The woman is canoeing across the pebble creek.", "gt-answer": "Option 1: The woman is walking across the pebble creek.", "video-llm-prediction": "Option 1: The woman is walking across the pebble creek.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is swimming across the pebble creek.\nSentence B: The woman is walking across the pebble creek.", "gt-answer": "Sentence B: The woman is walking across the pebble creek.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The woman is running across the pebble creek.\nCaption B: The woman is walking across the pebble creek.", "gt-answer": "Caption B: The woman is walking across the pebble creek.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1037628617": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is pressing a keyboard key and rotating a jog dial.\nSentence B: A person is clicking button and rolling wheel on a mouse.", "gt-answer": "Sentence B: A person is clicking button and rolling wheel on a mouse.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is tapping a touchpad and scrolling with two fingers.\nOption 2: A person is clicking button and rolling wheel on a mouse.", "gt-answer": "Option 2: A person is clicking button and rolling wheel on a mouse.", "video-llm-prediction": "Option 2: A person is clicking button and rolling wheel on a mouse.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A video showing a person's action of tapping a touchpad and scrolling with two fingers.\nCaption B: A person is clicking button and rolling wheel on a mouse.", "gt-answer": "Caption B: A person is clicking button and rolling wheel on a mouse.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1066801717": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is cutting a bouquet of daffodils.\nOption 2: The woman is arranging a bouquet of daffodils.", "gt-answer": "Option 2: The woman is arranging a bouquet of daffodils.", "video-llm-prediction": "Option 2: The woman is arranging a bouquet of daffodils.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is arranging a bouquet of daffodils.\nCaption B: A video showing a woman watering a bouquet of daffodils.", "gt-answer": "Caption A: The woman is arranging a bouquet of daffodils.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is planting a bouquet of daffodils.\nSentence B: The woman is arranging a bouquet of daffodils.", "gt-answer": "Sentence B: The woman is arranging a bouquet of daffodils.", "video-llm-prediction": "Sentence B: The woman is arranging a bouquet of daffodils.", "match_success": true, "rating": 1 } ] }, "1088428381": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is storing items in a gift box.\nSentence B: A woman is opening a gift box in the video.", "gt-answer": "Sentence B: A woman is opening a gift box in the video.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A woman is opening a gift box in the video.\nOption 2: The woman is wrapping a gift box.", "gt-answer": "Option 1: A woman is opening a gift box in the video.", "video-llm-prediction": "Option 1: A woman is opening a gift box in the video.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A woman is opening a gift box in the video.\nCaption B: The woman is delivering a gift box.", "gt-answer": "Caption A: A woman is opening a gift box in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1069593640": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is putting a towel on her neck.\nSentence B: The woman is drying hair with a towel.", "gt-answer": "Sentence A: The woman is putting a towel on her neck.", "video-llm-prediction": "Sentence A: The woman is putting a towel on her neck.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is putting a towel on her neck.\nCaption B: The woman is washing face with a towel.", "gt-answer": "Caption A: The woman is putting a towel on her neck.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The towel is being used to dry the woman's hair.\nOption 2: The woman is putting a towel on her neck.", "gt-answer": "Option 2: The woman is putting a towel on her neck.", "video-llm-prediction": "Option 1: The towel is being used to dry the woman's hair.", "match_success": true, "rating": 0 } ] }, "8307961": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is chatting with a woman while walking and then showing something on his tablet to her.\nSentence B: The man is walking and simultaneously showing something on his tablet to a woman.", "gt-answer": "Sentence A: The man is chatting with a woman while walking and then showing something on his tablet to her.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is chatting with a woman while walking and then showing something on his tablet to her.\nOption 2: The man is showing something on his tablet to a woman and then chatting with her while walking.", "gt-answer": "Option 1: The man is chatting with a woman while walking and then showing something on his tablet to her.", "video-llm-prediction": "Option 1: The man is chatting with a woman while walking and then showing something on his tablet to her.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is showing something on his tablet to a woman and then chatting with her while walking.\nCaption B: The man is chatting with a woman while walking and then showing something on his tablet to her.", "gt-answer": "Caption B: The man is chatting with a woman while walking and then showing something on his tablet to her.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "15439453": { "action": [ { "question": "Which caption matches the video better?\nCaption A: In the video, tango dancing and playing the piano are shown.\nCaption B: The video shows tango dancing and playing the saxophone.", "gt-answer": "Caption B: The video shows tango dancing and playing the saxophone.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The video shows ballet dancing and playing the saxophone.\nOption 2: The video shows tango dancing and playing the saxophone.", "gt-answer": "Option 2: The video shows tango dancing and playing the saxophone.", "video-llm-prediction": "Option 2: The video shows tango dancing and playing the saxophone.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video depicts tango dancing and playing the violin.\nSentence B: The video shows tango dancing and playing the saxophone.", "gt-answer": "Sentence B: The video shows tango dancing and playing the saxophone.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1107947873": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The doctor is giving medicine to a patient.\nSentence B: The doctor is writing a prescription.", "gt-answer": "Sentence A: The doctor is giving medicine to a patient.", "video-llm-prediction": "Sentence A: The doctor is giving medicine to a patient.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The doctor is giving medicine to a patient.\nCaption B: The doctor is performing a surgery.", "gt-answer": "Caption A: The doctor is giving medicine to a patient.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The doctor is giving medicine to a patient.\nOption 2: The doctor is checking vitals.", "gt-answer": "Option 1: The doctor is giving medicine to a patient.", "video-llm-prediction": "Option 1: The doctor is giving medicine to a patient.", "match_success": true, "rating": 1 } ] }, "1081194848": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The researcher is teaching children how to dissect a frog.\nOption 2: The researcher is teaching children how to cook a frog.", "gt-answer": "Option 1: The researcher is teaching children how to dissect a frog.", "video-llm-prediction": "Option 1: The researcher is teaching children how to dissect a frog.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The researcher is teaching children how to dissect a frog.\nSentence B: The researcher is teaching children how to feed a frog.", "gt-answer": "Sentence A: The researcher is teaching children how to dissect a frog.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The researcher is teaching children how to dissect a frog.\nCaption B: The researcher is teaching children how to catch a frog.", "gt-answer": "Caption A: The researcher is teaching children how to dissect a frog.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1091526823": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The hand is opening a book.\nSentence B: The hand is turning over pages of a book.", "gt-answer": "Sentence B: The hand is turning over pages of a book.", "video-llm-prediction": "Sentence B.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The hand is turning over pages of a book.\nCaption B: Someone is writing on a book.", "gt-answer": "Caption A: The hand is turning over pages of a book.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The hand is closing a book.\nOption 2: The hand is turning over pages of a book.", "gt-answer": "Option 2: The hand is turning over pages of a book.", "video-llm-prediction": "Option 2: The hand is turning over pages of a book.", "match_success": true, "rating": 1 } ] }, "26631100": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: First, two hand are holding the clay pot and then three hands are holding it.\nSentence B: In the video, three hands are holding the clay pot, then two hands are holding the clay pot.", "gt-answer": "Sentence B: In the video, three hands are holding the clay pot, then two hands are holding the clay pot.", "video-llm-prediction": "Sentence A: First, two hand are holding the clay pot and then three hands are holding it.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: In the video, three hands are holding the clay pot, then two hands are holding the clay pot.\nCaption B: First, two hand are holding the clay pot and then three hands are holding it.", "gt-answer": "Caption A: In the video, three hands are holding the clay pot, then two hands are holding the clay pot.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: First, two hand are holding the clay pot and then three hands are holding it.\nOption 2: In the video, three hands are holding the clay pot, then two hands are holding the clay pot.", "gt-answer": "Option 2: In the video, three hands are holding the clay pot, then two hands are holding the clay pot.", "video-llm-prediction": "Option 1: First, two hand are holding the clay pot and then three hands are holding it.", "match_success": true, "rating": 0 } ] }, "1104663381": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is cutting a pizza dough.\nOption 2: The man is stretching a pizza dough.", "gt-answer": "Option 2: The man is stretching a pizza dough.", "video-llm-prediction": "Option 2: The man is stretching a pizza dough.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A video showing the man folding a pizza dough.\nCaption B: The man is stretching a pizza dough.", "gt-answer": "Caption B: The man is stretching a pizza dough.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is stretching a pizza dough.\nSentence B: The man is cutting a pizza dough.", "gt-answer": "Sentence A: The man is stretching a pizza dough.", "video-llm-prediction": "Sentence A: The man is stretching a pizza dough.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which caption matches the video better?\nCaption A: The pizza dough is rotating counter-clockwise.\nCaption B: The pizza dough is rotating clockwise.", "gt-answer": "Caption A: The pizza dough is rotating counter-clockwise.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The pizza dough is rotating counter-clockwise.\nOption 2: The pizza dough is rotating clockwise.", "gt-answer": "Option 1: The pizza dough is rotating counter-clockwise.", "video-llm-prediction": "Option 1: The pizza dough is rotating counter-clockwise.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The pizza dough is flipping up and down.\nSentence B: The pizza dough is rotating counter-clockwise.", "gt-answer": "Sentence B: The pizza dough is rotating counter-clockwise.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "22100041": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The woman in the video is doing an invitation gesture.\nCaption B: The woman is waving goodbye.", "gt-answer": "Caption A: The woman in the video is doing an invitation gesture.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: She is clapping her hands.\nOption 2: The woman in the video is doing an invitation gesture.", "gt-answer": "Option 2: The woman in the video is doing an invitation gesture.", "video-llm-prediction": "Option 2: The woman in the video is doing an invitation gesture.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is pointing towards something.\nSentence B: The woman in the video is doing an invitation gesture.", "gt-answer": "Sentence B: The woman in the video is doing an invitation gesture.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1103623921": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The man is playing football.\nCaption B: The man is playing pool.", "gt-answer": "Caption B: The man is playing pool.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is playing pool.\nOption 2: The man is sleeping.", "gt-answer": "Option 1: The man is playing pool.", "video-llm-prediction": "Option 1: The man is playing pool.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is dancing.\nSentence B: The man is playing pool.", "gt-answer": "Sentence B: The man is playing pool.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The video is being played at a normal speed.\nOption 2: The video is being played in slow-motion.", "gt-answer": "Option 1: The video is being played at a normal speed.", "video-llm-prediction": "Option 1: The video is being played at a normal speed.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The video is being played at a normal speed.\nCaption B: The video is being fast-forwarded.", "gt-answer": "Caption A: The video is being played at a normal speed.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The video is being played at a normal speed.\nSentence B: The video is stopped.", "gt-answer": "Sentence A: The video is being played at a normal speed.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1093338031": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is trying to punch a computer screen.\nOption 2: The man is attempting to click a computer screen.", "gt-answer": "Option 1: The man is trying to punch a computer screen.", "video-llm-prediction": "Option 2: The man is attempting to click a computer screen.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The man is trying to punch a computer screen.\nCaption B: He is trying to fix a computer screen.", "gt-answer": "Caption A: The man is trying to punch a computer screen.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is cleaning a computer screen.\nSentence B: The man is trying to punch a computer screen.", "gt-answer": "Sentence B: The man is trying to punch a computer screen.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 } ] }, "1064310466": { "action": [ { "question": "Which caption matches the video better?\nCaption A: A man is peeling cocoa seeds.\nCaption B: The man is watering cocoa seeds.", "gt-answer": "Caption A: A man is peeling cocoa seeds.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is planting cocoa seeds.\nSentence B: A man is peeling cocoa seeds.", "gt-answer": "Sentence B: A man is peeling cocoa seeds.", "video-llm-prediction": "Sentence B: A man is peeling cocoa seeds.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A man is baking cocoa seeds.\nOption 2: A man is peeling cocoa seeds.", "gt-answer": "Option 2: A man is peeling cocoa seeds.", "video-llm-prediction": "Option 2: A man is peeling cocoa seeds.", "match_success": true, "rating": 1 } ] }, "1088497853": { "direction": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The movement in the video is upwards.\nOption 2: The movement in the video is leftwards.", "gt-answer": "Option 1: The movement in the video is upwards.", "video-llm-prediction": "Option 1: The movement in the video is upwards.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The camera is moving downwards before the stone building.\nCaption B: The movement in the video is upwards.", "gt-answer": "Caption B: The movement in the video is upwards.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The movement in the video is rightwards.\nSentence B: The movement in the video is upwards.", "gt-answer": "Sentence B: The movement in the video is upwards.", "video-llm-prediction": "Sentence B: The movement in the video is upwards.", "match_success": true, "rating": 1 } ] }, "1106087175": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is taking off a white sneaker.\nSentence B: The man is drawing on a white sneaker.", "gt-answer": "Sentence B: The man is drawing on a white sneaker.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is tying shoelaces on a white sneaker.\nOption 2: The man is drawing on a white sneaker.", "gt-answer": "Option 2: The man is drawing on a white sneaker.", "video-llm-prediction": "Option 1: The man is tying shoelaces on a white sneaker.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The man is wearing a white sneaker.\nCaption B: The man is drawing on a white sneaker.", "gt-answer": "Caption B: The man is drawing on a white sneaker.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "13324343": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is tying his shoelaces and then gliding on the skateboard.\nOption 2: The man is gliding on the skateboard and then tying his shoelaces.", "gt-answer": "Option 1: The man is tying his shoelaces and then gliding on the skateboard.", "video-llm-prediction": "Option 1: The man is tying his shoelaces and then gliding on the skateboard.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is tying his shoelaces and then gliding on the skateboard.\nSentence B: The man is gliding on the skateboard and then tying his shoelaces.", "gt-answer": "Sentence A: The man is tying his shoelaces and then gliding on the skateboard.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is tying his shoelaces and then gliding on the skateboard.\nCaption B: A video showing a man gliding on the skateboard and then tying his shoelaces.", "gt-answer": "Caption A: The man is tying his shoelaces and then gliding on the skateboard.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1083624811": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is performing alternating leg lift plank.\nSentence B: The woman is performing push-ups.", "gt-answer": "Sentence A: The woman is performing alternating leg lift plank.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is performing alternating leg lift plank.\nCaption B: The woman is performing a traditional plank hold.", "gt-answer": "Caption A: The woman is performing alternating leg lift plank.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is performing side plank variations.\nOption 2: The woman is performing alternating leg lift plank.", "gt-answer": "Option 2: The woman is performing alternating leg lift plank.", "video-llm-prediction": "Option 2: The woman is performing alternating leg lift plank.", "match_success": true, "rating": 1 } ] }, "1014976360": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The man first looks at his phone and then takes off his glasses.\nCaption B: The man puts on his glasses and then looks at his phone.", "gt-answer": "Caption A: The man first looks at his phone and then takes off his glasses.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man takes off his glasses and then looks at his phone.\nOption 2: The man first looks at his phone and then takes off his glasses.", "gt-answer": "Option 2: The man first looks at his phone and then takes off his glasses.", "video-llm-prediction": "Option 2: The man first looks at his phone and then takes off his glasses.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man takes off his glasses and then looks at his phone.\nSentence B: The man first looks at his phone and then takes off his glasses.", "gt-answer": "Sentence B: The man first looks at his phone and then takes off his glasses.", "video-llm-prediction": "Sentence B: The man first looks at his phone and then takes off his glasses.", "match_success": true, "rating": 1 } ] }, "18416608": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman first operates her tablet, then samples water in a bottle.\nSentence B: The woman first samples water in a bottle, then operates her tablet.", "gt-answer": "Sentence B: The woman first samples water in a bottle, then operates her tablet.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman first samples water in a bottle, then operates her tablet.\nOption 2: The woman first operates her tablet, then samples water in a bottle.", "gt-answer": "Option 1: The woman first samples water in a bottle, then operates her tablet.", "video-llm-prediction": "Option 2: The woman first operates her tablet, then samples water in a bottle.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The woman first samples water in a bottle, then operates her tablet.\nCaption B: The woman first operates her tablet, then samples water in a bottle.", "gt-answer": "Caption A: The woman first samples water in a bottle, then operates her tablet.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1061351290": { "order": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.\nOption 2: The woman is measuring her belly with a measuring tape and then touching her pregnant belly.", "gt-answer": "Option 1: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.", "video-llm-prediction": "Option 1: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.\nCaption B: The woman is taking off clothes then measuring her belly with a measuring tape.", "gt-answer": "Caption A: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is touching her pregnant belly and then taking off clothes.\nSentence B: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.", "gt-answer": "Sentence B: The woman is touching her pregnant belly and then measuring her belly with a measuring tape.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1066238617": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The woman is practising her punches.\nCaption B: A woman is dancing.", "gt-answer": "Caption A: The woman is practising her punches.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is practising her punches.\nOption 2: She is cooking.", "gt-answer": "Option 1: The woman is practising her punches.", "video-llm-prediction": "Option 1: The woman is practising her punches.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is swimming.\nSentence B: The woman is practising her punches.", "gt-answer": "Sentence B: The woman is practising her punches.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 } ] }, "1072000366": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The girls are elbowing each other.\nOption 2: The girls are giving high fives to each other.", "gt-answer": "Option 1: The girls are elbowing each other.", "video-llm-prediction": "Option 1: The girls are elbowing each other.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: They are waving at each other.\nSentence B: The girls are elbowing each other.", "gt-answer": "Sentence B: The girls are elbowing each other.", "video-llm-prediction": "Sentence A: They are waving at each other.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: The girls are elbowing each other.\nCaption B: The girls are shaking hands.", "gt-answer": "Caption A: The girls are elbowing each other.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1065272113": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The doctor is giving the woman an injection.\nSentence B: The doctor is taking her blood pressure.", "gt-answer": "Sentence A: The doctor is giving the woman an injection.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The doctor is giving the woman an injection.\nCaption B: The doctor is checking her temperature.", "gt-answer": "Caption A: The doctor is giving the woman an injection.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The doctor is applying a bandage.\nOption 2: The doctor is giving the woman an injection.", "gt-answer": "Option 2: The doctor is giving the woman an injection.", "video-llm-prediction": "Option 2: The doctor is giving the woman an injection.", "match_success": true, "rating": 1 } ] }, "1072971926": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is wrapping the pizza box.\nSentence B: The man is opening the pizza box.", "gt-answer": "Sentence B: The man is opening the pizza box.", "video-llm-prediction": "Sentence A: The man is wrapping the pizza box.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: A video showing a person eating the pizza.\nCaption B: The man is opening the pizza box.", "gt-answer": "Caption B: The man is opening the pizza box.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is opening the pizza box.\nOption 2: The man is closing the pizza box.", "gt-answer": "Option 1: The man is opening the pizza box.", "video-llm-prediction": "Option 1: The man is opening the pizza box.", "match_success": true, "rating": 1 } ] }, "3399348431": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is mixing the sauce with the vegetables.\nSentence B: A person is squeezing the sauce into a bowl of vegetables.", "gt-answer": "Sentence B: A person is squeezing the sauce into a bowl of vegetables.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A video showing dipping vegetables on the sauce.\nOption 2: A person is squeezing the sauce into a bowl of vegetables.", "gt-answer": "Option 2: A person is squeezing the sauce into a bowl of vegetables.", "video-llm-prediction": "Option 2: A person is squeezing the sauce into a bowl of vegetables.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A person is mixing sauce with the vegetables.\nCaption B: A person is squeezing the sauce into a bowl of vegetables.", "gt-answer": "Caption B: A person is squeezing the sauce into a bowl of vegetables.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1025137214": { "action": [ { "question": "Which caption matches the video better?\nCaption A: A man is walking.\nCaption B: A man is smoking a cigarette.", "gt-answer": "Caption B: A man is smoking a cigarette.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is talking on the phone.\nSentence B: A man is smoking a cigarette.", "gt-answer": "Sentence B: A man is smoking a cigarette.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is reading a book.\nOption 2: A man is smoking a cigarette.", "gt-answer": "Option 2: A man is smoking a cigarette.", "video-llm-prediction": "Option 2: A man is smoking a cigarette.", "match_success": true, "rating": 1 } ] }, "1033101626": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The man is cooking.\nCaption B: The man is playing an instrument.", "gt-answer": "Caption B: The man is playing an instrument.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is playing an instrument.\nOption 2: A video showing the man singing.", "gt-answer": "Option 1: The man is playing an instrument.", "video-llm-prediction": "Option 1: The man is playing an instrument.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is playing an instrument.\nSentence B: The man is reading.", "gt-answer": "Sentence A: The man is playing an instrument.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "9537677": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The woman is reading a book.\nCaption B: The woman is engaged in playing a tablet.", "gt-answer": "Caption B: The woman is engaged in playing a tablet.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is engaged in playing a tablet.\nOption 2: A video showing the woman watching TV.", "gt-answer": "Option 1: The woman is engaged in playing a tablet.", "video-llm-prediction": "Option 1: The woman is engaged in playing a tablet.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is engaged in playing a tablet.\nSentence B: The woman is dancing.", "gt-answer": "Sentence A: The woman is engaged in playing a tablet.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1077388994": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is singing.\nOption 2: The woman is patting the baby.", "gt-answer": "Option 2: The woman is patting the baby.", "video-llm-prediction": "Option 2: The woman is patting the baby.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is patting the baby.\nSentence B: A person dancing.", "gt-answer": "Sentence A: The woman is patting the baby.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: She is cooking dinner.\nCaption B: The woman is patting the baby.", "gt-answer": "Caption B: The woman is patting the baby.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1037531786": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The two men are boxing.\nOption 2: The two men are dancing.", "gt-answer": "Option 1: The two men are boxing.", "video-llm-prediction": "Option 1: The two men are boxing.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The two men are cooking.\nCaption B: The two men are boxing.", "gt-answer": "Caption B: The two men are boxing.", "video-llm-prediction": "Caption B: The two men are boxing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The two men are painting.\nSentence B: The two men are boxing.", "gt-answer": "Sentence B: The two men are boxing.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1077275024": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The girl is jumping with a man playing ukulele.\nOption 2: The girl is clapping hands for a man playing ukulele.", "gt-answer": "Option 2: The girl is clapping hands for a man playing ukulele.", "video-llm-prediction": "Option 2: The girl is clapping hands for a man playing ukulele.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The girl is clapping hands for a man playing ukulele.\nCaption B: The girl is dancing with a man playing ukulele.", "gt-answer": "Caption A: The girl is clapping hands for a man playing ukulele.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The girl is clapping hands for a man playing ukulele.\nSentence B: The girl is sitting and watching a man play the ukulele.", "gt-answer": "Sentence A: The girl is clapping hands for a man playing ukulele.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1107180099": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The women are singing.\nCaption B: The women are dancing.", "gt-answer": "Caption B: The women are dancing.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The women are dancing.\nOption 2: The women are painting.", "gt-answer": "Option 1: The women are dancing.", "video-llm-prediction": "Option 1: The women are dancing.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The women are dancing.\nSentence B: The women are cooking.", "gt-answer": "Sentence A: The women are dancing.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 } ] }, "1049434159": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The parents and daughter are cooking dinner.\nOption 2: The parents and daughter are playing video games together.", "gt-answer": "Option 2: The parents and daughter are playing video games together.", "video-llm-prediction": "Option 2: The parents and daughter are playing video games together.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The parents and daughter are playing video games together.\nCaption B: A family engagement in reading a book.", "gt-answer": "Caption A: The parents and daughter are playing video games together.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: They are hiking together.\nSentence B: The parents and daughter are playing video games together.", "gt-answer": "Sentence B: The parents and daughter are playing video games together.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "3402234027": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The cat is sleeping.\nOption 2: The cat is eating food.", "gt-answer": "Option 2: The cat is eating food.", "video-llm-prediction": "Option 2: The cat is eating food.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The cat is eating food.\nSentence B: A video showing the cat playing with a toy.", "gt-answer": "Sentence A: The cat is eating food.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The cat is swimming.\nCaption B: The cat is eating food.", "gt-answer": "Caption B: The cat is eating food.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1056491306": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: Passengers are taking a seat on the subway.\nSentence B: Passengers are sleeping on the bed.", "gt-answer": "Sentence A: Passengers are taking a seat on the subway.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: Passengers are taking a seat on the subway.\nOption 2: Passengers are standing in a room.", "gt-answer": "Option 1: Passengers are taking a seat on the subway.", "video-llm-prediction": "Option 1: Passengers are taking a seat on the subway.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: Passengers are taking a seat on the subway.\nCaption B: Passengers are dancing on the stage.", "gt-answer": "Caption A: Passengers are taking a seat on the subway.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 } ] }, "1012085909": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The people are rolling boats on the lake.\nSentence B: The people in the video are pushing bikes.", "gt-answer": "Sentence B: The people in the video are pushing bikes.", "video-llm-prediction": "Sentence B: The people in the video are pushing bikes.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A group of people walking on the street.\nCaption B: The people in the video are pushing bikes.", "gt-answer": "Caption B: The people in the video are pushing bikes.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The people in the video are pushing bikes.\nOption 2: The people are swimming.", "gt-answer": "Option 1: The people in the video are pushing bikes.", "video-llm-prediction": "Option 1: The people in the video are pushing bikes.", "match_success": true, "rating": 1 } ] }, "1079406734": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: A man is washing the car in the video.\nOption 2: The man is riding bikes.", "gt-answer": "Option 1: A man is washing the car in the video.", "video-llm-prediction": "Option 1: A man is washing the car in the video.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A man is washing the car in the video.\nSentence B: The man is taking a shower.", "gt-answer": "Sentence A: A man is washing the car in the video.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is driving the car.\nCaption B: A man is washing the car in the video.", "gt-answer": "Caption B: A man is washing the car in the video.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1022115337": { "order": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The order of events is sending an air kiss first and then dancing.\nSentence B: The order of events is dancing first and then sending an air kiss.", "gt-answer": "Sentence B: The order of events is dancing first and then sending an air kiss.", "video-llm-prediction": "Sentence A: The order of events is sending an air kiss first and then dancing.", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The order of events is dancing first and then sending an air kiss.\nOption 2: The order of events is sending an air kiss first and then dancing.", "gt-answer": "Option 1: The order of events is dancing first and then sending an air kiss.", "video-llm-prediction": "Option 1: The order of events is dancing first and then sending an air kiss.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The girl is dancing first and then sending an air kiss.\nCaption B: The girl is sending an air kiss first and then dancing.", "gt-answer": "Caption A: The girl is dancing first and then sending an air kiss.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 0 } ] }, "1071214909": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: A person is drawing a cutting line on a wood surface.\nSentence B: The person is carving a design on the wood surface.", "gt-answer": "Sentence A: A person is drawing a cutting line on a wood surface.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: A video showing a person measuring the length on a wood surface.\nCaption B: A person is drawing a cutting line on a wood surface.", "gt-answer": "Caption B: A person is drawing a cutting line on a wood surface.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The person is sanding the surface of the wood.\nOption 2: A person is drawing a cutting line on a wood surface.", "gt-answer": "Option 2: A person is drawing a cutting line on a wood surface.", "video-llm-prediction": "Option 2: A person is drawing a cutting line on a wood surface.", "match_success": true, "rating": 1 } ] }, "1092065543": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is eating.\nSentence B: The man is shopping.", "gt-answer": "Sentence B: The man is shopping.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is shopping.\nCaption B: The man is sleeping.", "gt-answer": "Caption A: The man is shopping.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The man is running.\nOption 2: The man is shopping.", "gt-answer": "Option 2: The man is shopping.", "video-llm-prediction": "Option 2: The man is shopping.", "match_success": true, "rating": 1 } ] }, "1017063703": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The person is baking cakes.\nCaption B: A person in the video is decorating cakes.", "gt-answer": "Caption B: A person in the video is decorating cakes.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A person in the video is decorating cakes.\nSentence B: The person is cutting cakes.", "gt-answer": "Sentence A: A person in the video is decorating cakes.", "video-llm-prediction": "Sentence A: A person in the video is decorating cakes.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A video showing someone presenting cakes to guests.\nOption 2: A person in the video is decorating cakes.", "gt-answer": "Option 2: A person in the video is decorating cakes.", "video-llm-prediction": "Option 2: A person in the video is decorating cakes.", "match_success": true, "rating": 1 } ] }, "1055022287": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The man in the video is cooking.\nCaption B: The man in the video is cleaning a swimming pool.", "gt-answer": "Caption B: The man in the video is cleaning a swimming pool.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: A person in the video is singing.\nOption 2: The man in the video is cleaning a swimming pool.", "gt-answer": "Option 2: The man in the video is cleaning a swimming pool.", "video-llm-prediction": "Option 2: The man in the video is cleaning a swimming pool.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man in the video is cleaning a swimming pool.\nSentence B: The man is playing basketball.", "gt-answer": "Sentence A: The man in the video is cleaning a swimming pool.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 1 } ] }, "1094259081": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The woman is watching a VR movie.\nSentence B: A woman is playing a VR shooting game in the video.", "gt-answer": "Sentence B: A woman is playing a VR shooting game in the video.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 0 }, { "question": "Which caption matches the video better?\nCaption A: A woman is playing a VR shooting game in the video.\nCaption B: She is listening to music using VR.", "gt-answer": "Caption A: A woman is playing a VR shooting game in the video.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The woman is working out using VR.\nOption 2: A woman is playing a VR shooting game in the video.", "gt-answer": "Option 2: A woman is playing a VR shooting game in the video.", "video-llm-prediction": "Option 1: The woman is working out using VR.", "match_success": true, "rating": 0 } ] }, "1022260408": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The squirrel is sleeping.\nCaption B: The squirrel is eating food.", "gt-answer": "Caption B: The squirrel is eating food.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: A video showing a squirrel running.\nSentence B: The squirrel is eating food.", "gt-answer": "Sentence B: The squirrel is eating food.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The squirrel is chasing its tail.\nOption 2: The squirrel is eating food.", "gt-answer": "Option 2: The squirrel is eating food.", "video-llm-prediction": "Option 2: The squirrel is eating food.", "match_success": true, "rating": 1 } ] }, "1089810969": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The little girl runs towards the woman and hugs her.\nCaption B: The little girl walks towards the woman and hugs her.", "gt-answer": "Caption A: The little girl runs towards the woman and hugs her.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The little girl runs towards the woman and jumps on her back.\nSentence B: The little girl runs towards the woman and hugs her.", "gt-answer": "Sentence B: The little girl runs towards the woman and hugs her.", "video-llm-prediction": "Sentence A", "match_success": true, "rating": 0 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The little girl runs towards the woman and talks to her.\nOption 2: The little girl runs towards the woman and hugs her.", "gt-answer": "Option 2: The little girl runs towards the woman and hugs her.", "video-llm-prediction": "Option 2: The little girl runs towards the woman and hugs her.", "match_success": true, "rating": 1 } ] }, "6165731": { "action": [ { "question": "Which sentence better captures the essence of the video?\nSentence A: The scientist is looking confused and frustrated about the experiment.\nSentence B: The scientist is observing quietly on the experiment.", "gt-answer": "Sentence A: The scientist is looking confused and frustrated about the experiment.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The scientist is looking confused and frustrated about the experiment.\nOption 2: The scientist is leisurely conducting experiments.", "gt-answer": "Option 1: The scientist is looking confused and frustrated about the experiment.", "video-llm-prediction": "Option 1: The scientist is looking confused and frustrated about the experiment.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The scientist feels excited and motivated about the experiment.\nCaption B: The scientist is looking confused and frustrated about the experiment.", "gt-answer": "Caption B: The scientist is looking confused and frustrated about the experiment.", "video-llm-prediction": "Caption A", "match_success": true, "rating": 0 } ] }, "1111469465": { "action": [ { "question": "Which description is a more suitable match for the video?\nOption 1: The man is raising his arm to look at the watch and he appears anxious.\nOption 2: The man is raising his arm to look at the watch and he looks happy.", "gt-answer": "Option 1: The man is raising his arm to look at the watch and he appears anxious.", "video-llm-prediction": "Option 1: The man is raising his arm to look at the watch and he appears anxious.", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man is raising his arm to look at the watch and he appears anxious.\nSentence B: The man is raising his arm to look at the watch and he looks calm.", "gt-answer": "Sentence A: The man is raising his arm to look at the watch and he appears anxious.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which caption matches the video better?\nCaption A: The man is putting his hands in his pockets and he looks anxious.\nCaption B: The man is raising his arm to look at the watch and he appears anxious.", "gt-answer": "Caption B: The man is raising his arm to look at the watch and he appears anxious.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 } ] }, "1050000214": { "action": [ { "question": "Which caption matches the video better?\nCaption A: The little child is running.\nCaption B: The little child is performing water jumping.", "gt-answer": "Caption B: The little child is performing water jumping.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The little child is swimming.\nSentence B: The little child is performing water jumping.", "gt-answer": "Sentence B: The little child is performing water jumping.", "video-llm-prediction": "Sentence B", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The little child is dancing.\nOption 2: The little child is performing water jumping.", "gt-answer": "Option 2: The little child is performing water jumping.", "video-llm-prediction": "Option 2: The little child is performing water jumping.", "match_success": true, "rating": 1 } ] }, "27537016": { "order": [ { "question": "Which caption matches the video better?\nCaption A: The man pulls back inside the car and then shows off his car key.\nCaption B: The man first shows off his car key, then pulls back inside the car.", "gt-answer": "Caption B: The man first shows off his car key, then pulls back inside the car.", "video-llm-prediction": "Caption B", "match_success": true, "rating": 1 }, { "question": "Which sentence better captures the essence of the video?\nSentence A: The man first shows off his car key, then pulls back inside the car.\nSentence B: After pulling back inside the car, the man shows off his car key.", "gt-answer": "Sentence A: The man first shows off his car key, then pulls back inside the car.", "video-llm-prediction": "Sentence A.", "match_success": true, "rating": 1 }, { "question": "Which description is a more suitable match for the video?\nOption 1: The correct order of actions by the man is throwing away his car key, then pulling back inside the car.\nOption 2: The man first shows off his car key, then pulls back inside the car.", "gt-answer": "Option 2: The man first shows off his car key, then pulls back inside the car.", "video-llm-prediction": "Option 1: The correct order of actions by the man is throwing away his car key, then pulling back inside the car.", "match_success": true, "rating": 0 } ] } }, "multi-choice": { "1034419625": { "action": [ { "question": "What is the man doing in the video?\nA. dunking a basketball\nB. dribbling a basketball\nC. passing a basketball", "gt-answer": "A. dunking a basketball", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which activity is the man engaged in?\nA. passing a basketball\nB. dribbling a basketball\nC. dunking a basketball", "gt-answer": "C. dunking a basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is the man performing?\nA. dribbling a basketball\nB. dunking a basketball\nC. passing a basketball", "gt-answer": "B. dunking a basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following actions describes the man?\nA. dribbling a basketball\nB. passing a basketball\nC. dunking a basketball", "gt-answer": "C. dunking a basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "What is the direction of the man?\nA. moving towards the camera\nB. moving from left to right\nC. moving away from the camera", "gt-answer": "B. moving from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "From the camera's point of view, in which direction is the man moving?\nA. away from the camera\nB. towards the camera\nC. from left to right", "gt-answer": "C. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the camera's position, which way is the man headed?\nA. from left to right\nB. towards the camera\nC. from right to left", "gt-answer": "A. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1034419625_reverse": { "direction": [ { "question": "What is the direction of the man?\nA. moving towards the camera\nB. moving from right to left\nC. moving away from the camera\nD. moving from left to right", "gt-answer": "B. moving from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "From the camera's point of view, in which direction is the man moving?\nA. away from the camera\nB. towards the camera\nC. from right to left\nD. from left to right", "gt-answer": "C. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the camera's position, which way is the man headed?\nA. from right to left\nB. towards the camera\nC. from left to right\nD. away from the camera", "gt-answer": "A. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1094590221": { "action": [ { "question": "What is the man doing in the video?\nA. dribbling basketball\nB. passing basketball\nC. shooting basketball\nD. dunking basketball", "gt-answer": "C. shooting basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity is depicted in the video?\nA. shooting basketball\nB. dribbling basketball\nC. dunking basketball\nD. passing basketball", "gt-answer": "A. shooting basketball", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which action is being performed by the man?\nA. dunking basketball\nB. dribbling basketball\nC. painting\nD. shooting basketball", "gt-answer": "D. shooting basketball", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the main action of the man in the video?\nA. dribbling basketball\nB. shooting basketball\nC. dunking basketball\nD. passing basketball", "gt-answer": "B. shooting basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what is the man engaged in?\nA. passing basketball\nB. shooting basketball\nC. dunking basketball\nD. dribbling basketball", "gt-answer": "B. shooting basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "What direction is the basketball moving?\nA. straight ahead\nB. left to right\nC. right to left", "gt-answer": "C. right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the basketball move in the horizontal direction?\nA. left to right\nB. right to left\nC. standing still", "gt-answer": "B. right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "From which side of the screen does the basketball ends moving?\nA. right top\nB. right bottom\nC. left bottom\nD. left top", "gt-answer": "C. left bottom", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1094590221_reverse": { "direction": [ { "question": "What direction is the basketball moving?\nA. straight ahead\nB. left to right\nC. right to left", "gt-answer": "B. left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the basketball move in the horizontal direction?\nA. left to right\nB. right to left\nC. standing still", "gt-answer": "A. left to right", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "From which side of the screen does the basketball start moving?\nA. right top\nB. right bottom\nC. left bottom\nD. left top", "gt-answer": "C. left bottom", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1098982673": { "action": [ { "question": "What is the woman doing?\nA. Eating and singing\nB. Dancing and singing\nC. Sleeping and singing\nD. Running and singing", "gt-answer": "B. Dancing and singing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be observed about the woman?\nA. She is cooking meal\nB. She is dancing and singing\nC. She is washing dishes\nD. She is walking", "gt-answer": "B. She is dancing and singing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what actions is the woman involved in?\nA. Cooking\nB. Jumping\nC. Dancing and singing\nD. Doing laundry", "gt-answer": "C. Dancing and singing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. slow motion\nC. fast forward\nD. reverse", "gt-answer": "A. normal speed", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "How fast is the video playing?\nA. 2x speed\nB. 1x speed\nC. 10x speed\nD. 0.5x speed", "gt-answer": "B. 1x speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which speed setting does the video appear to be at?\nA. fluctuating speed\nB. real-time speed\nC. decelerated speed\nD. accelerated speed", "gt-answer": "B. real-time speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what pace is the video running?\nA. rapid pace\nB. leisure pace\nC. standard pace\nD. sporadic pace", "gt-answer": "C. standard pace", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the tempo of the video?\nA. erratic tempo\nB. moderate tempo\nC. brisk tempo\nD. sluggish tempo", "gt-answer": "B. moderate tempo", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1111657885": { "action": [ { "question": "What are the people doing?\nA. skiing\nB. ice skating\nC. swimming", "gt-answer": "B. ice skating", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What sport are the people engaged in?\nA. tennis\nB. soccer\nC. ice skating", "gt-answer": "C. ice skating", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity can be observed in the video?\nA. dancing\nB. painting\nC. ice skating", "gt-answer": "C. ice skating", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action are the people performing?\nA. ice skating\nB. playing guitar\nC. playing basketball", "gt-answer": "A. ice skating", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the action being performed by the individuals?\nA. ice skating\nB. yoga\nC. running", "gt-answer": "A. ice skating", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the tempo of the video?\nA. rapid pace\nB. slow motion\nC. normal speed", "gt-answer": "B. slow motion", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How is the entire video presented?\nA. pause\nB. fast forward\nC. slow motion", "gt-answer": "C. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In which speed mode is the video playing?\nA. real-time speed\nB. slow motion\nC. accelerated\nD. standing still", "gt-answer": "B. slow motion", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which direction are the people skating?\nA. towards the camera\nB. parallel to the screen\nC. away from the camera", "gt-answer": "A. towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction are the people moving?\nA. standing still\nB. towards the camera\nC. from right to left in relation to the camera\nD. away from the camera", "gt-answer": "B. towards the camera", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "How would you describe the movement of the people?\nA. gliding away from the camera\nB. gliding towards the camera\nC. gliding parallel the camera", "gt-answer": "B. gliding towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1111657885_reverse": { "direction": [ { "question": "Which direction are the people skating?\nA. towards the camera\nB. parallel to the screen\nC. away from the camera", "gt-answer": "C. away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction are the people moving?\nA. standing still\nB. towards the camera\nC. from right to left in relation to the camera\nD. away from the camera", "gt-answer": "D. away from the camera", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "How would you describe the movement of the people?\nA. gliding away from the camera\nB. gliding towards the camera\nC. gliding parallel the camera", "gt-answer": "A. gliding away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1073873933": { "action": [ { "question": "What is happening in the video?\nA. eating\nB. fighting\nC. sleeping\nD. dancing", "gt-answer": "B. fighting", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity is the monkey engaged in?\nA. swimming\nB. running\nC. climbing\nD. fighting", "gt-answer": "D. fighting", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the main action of the monkey?\nA. reading\nB. hiding\nC. painting\nD. fighting", "gt-answer": "D. fighting", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which action is depicted by the monkey?\nA. singing\nB. fighting\nC. knitting\nD. playing chess", "gt-answer": "B. fighting", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity is the monkey participating in?\nA. fishing\nB. skiing\nC. shopping\nD. fighting", "gt-answer": "D. fighting", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1089810425": { "action": [ { "question": "What are the people doing?\nA. cooking\nB. sleeping\nC. dancing", "gt-answer": "C. dancing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity are the people engaged in?\nA. swimming\nB. dancing\nC. painting", "gt-answer": "B. dancing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action are the people performing?\nA. singing\nB. dancing\nC. reading", "gt-answer": "B. dancing", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the activity of the people?\nA. dancing\nB. running\nC. studying", "gt-answer": "A. dancing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What are the people participating in?\nA. dancing\nB. knitting\nC. playing football", "gt-answer": "A. dancing", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. slow motion\nB. normal speed\nC. time-lapse", "gt-answer": "B. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the tempo of the entire video?\nA. slow\nB. regular\nC. fast", "gt-answer": "B. regular", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the rate of the video?\nA. moderate speed\nB. low speed\nC. high speed", "gt-answer": "A. moderate speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What is the direction of the panning in the video?\nA. left to right\nB. right to left\nC. up and down\nD. circular motion", "gt-answer": "B. right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement of the camera in the video?\nA. panning from right to left\nB. zooming in\nC. zooming out\nD. panning from left to right", "gt-answer": "A. panning from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which way is the video shifting?\nA. horizontal\nB. diagonal\nC. vertical", "gt-answer": "A. horizontal", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction is the camera moving?\nA. leftward\nB. upward\nC. downward\nD. rightward", "gt-answer": "A. leftward", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1089810425_reverse": { "direction": [ { "question": "What is the direction of the panning in the video?\nA. left to right\nB. right to left\nC. up and down\nD. circular motion", "gt-answer": "A. left to right", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the movement of the camera in the video?\nA. panning from right to left\nB. zooming in\nC. zooming out\nD. panning from left to right", "gt-answer": "D. panning from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the video shifting?\nA. horizontal\nB. diagonal\nC. vertical", "gt-answer": "A. horizontal", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction is the camera moving?\nA. leftward\nB. upward\nC. downward\nD. rightward", "gt-answer": "D. rightward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077507593": { "action": [ { "question": "What are the people doing in the video?\nA. sleeping\nB. eating\nC. dancing\nD. cooking", "gt-answer": "D. cooking", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which activity can be seen in the video?\nA. painting\nB. reading\nC. cooking\nD. swimming", "gt-answer": "C. cooking", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the action being performed by the individuals?\nA. writing\nB. singing\nC. running\nD. cooking", "gt-answer": "D. cooking", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What can you observe the people doing in the footage?\nA. playing sports\nB. studying\nC. cooking\nD. shopping", "gt-answer": "C. cooking", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which verb best describes the action of the people?\nA. sleeping\nB. cooking\nC. talking\nD. driving", "gt-answer": "B. cooking", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. slow motion\nC. time-lapse", "gt-answer": "B. slow motion", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the rate at which the events are happening in the video?\nA. gradual\nB. fast\nC. slow", "gt-answer": "C. slow", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the tempo of the video?\nA. slow tempo\nB. rapid tempo\nC. moderate tempo", "gt-answer": "A. slow tempo", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How would you describe the pace of the video?\nA. medium-paced\nB. quick-paced\nC. slow-paced", "gt-answer": "C. slow-paced", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "order": [ { "question": "Which event happens first to the skillet?\nA. Burning in fire\nB. None of both\nC. Smoking", "gt-answer": "C. Smoking", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the sequence of events for the skillet?\nA. Smoking, and then burning in fire\nB. Burning in fire, and then smoking\nC. Smoking without burning in fire", "gt-answer": "A. Smoking, and then burning in fire", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "When does the skillet smoke?\nA. After burning in fire\nB. The skillet doesn't smoke\nC. Before burning in fire", "gt-answer": "C. Before burning in fire", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what order do the events occur with the skillet?\nA. Smoking, followed by burning in fire\nB. Burning in fire, followed by smoking\nC. Both events happen simultaneously", "gt-answer": "B. Burning in fire, followed by smoking", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1107116885": { "action": [ { "question": "What activity is the man engaged in?\nA. swimming\nB. shooting an arrow\nC. running", "gt-answer": "B. shooting an arrow", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which sport is the man participating in?\nA. soccer\nB. archery\nC. basketball", "gt-answer": "B. archery", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What action is being performed by the man?\nA. dancing\nB. shooting an arrow\nC. singing", "gt-answer": "B. shooting an arrow", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the man doing with the bow?\nA. throwing it away\nB. playing it like a guitar\nC. shooting an arrow", "gt-answer": "C. shooting an arrow", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In the given footage, what is the man involved in?\nA. cooking\nB. painting\nC. shooting an arrow", "gt-answer": "C. shooting an arrow", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the pace of the video?\nA. time-lapse\nB. accelerated speed\nC. slow motion\nD. normal speed", "gt-answer": "D. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How fast is the video playing?\nA. at an average speed\nB. with time-lapse effect\nC. in slow motion\nD. at a rapid speed", "gt-answer": "A. at an average speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which speed setting is applied to the entire video?\nA. fast-forward\nB. normal speed\nC. slow motion\nD. time-lapse", "gt-answer": "B. normal speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "At what rate is the video playing?\nA. with a time warp\nB. slowly\nC. rapidly\nD. normally", "gt-answer": "D. normally", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the tempo of the video?\nA. speeded-up\nB. regular\nC. quick\nD. sluggish", "gt-answer": "B. regular", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059718130": { "speed": [ { "question": "What is the speed of the video?\nA. slow motion\nB. normal speed\nC. time-lapse\nD. stop motion", "gt-answer": "C. time-lapse", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the pace at which the video is playing?\nA. fast-forward\nB. slow motion\nC. real-time", "gt-answer": "A. fast-forward", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "At what rate does the video progress?\nA. slow motion\nB. normal speed\nC. time-lapse\nD. reverse motion", "gt-answer": "C. time-lapse", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What direction is the sun moving in?\nA. falling\nB. rising\nC. staying in one place", "gt-answer": "B. rising", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the direction of the sun?\nA. stationary\nB. falling\nC. rising", "gt-answer": "C. rising", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the primary movement of the sun?\nA. descending\nB. standing still\nC. rising", "gt-answer": "C. rising", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the video's brightness?\nA. getting darker\nB. staying the same\nC. turning brighter", "gt-answer": "C. turning brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the attribute of brightness changing?\nA. remaining stable\nB. increasing\nC. decreasing", "gt-answer": "B. increasing", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What transformation is occurring in the brightness of the video?\nA. remaining constant\nB. brightening\nC. dimming", "gt-answer": "B. brightening", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059718130_reverse": { "direction": [ { "question": "What direction is the sun moving in?\nA. setting\nB. rising\nC. staying in one place", "gt-answer": "A. setting", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the direction of the sun?\nA. stationary\nB. falling\nC. rising", "gt-answer": "B. falling", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the primary movement of the sun?\nA. descending\nB. standing still\nC. rising", "gt-answer": "A. descending", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the video's brightness?\nA. getting darker\nB. staying the same\nC. turning brighter", "gt-answer": "A. getting darker", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the attribute of brightness changing?\nA. remaining stable\nB. increasing\nC. decreasing", "gt-answer": "C. decreasing", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What transformation is occurring in the brightness of the video?\nA. remaining constant\nB. brightening\nC. dimming", "gt-answer": "C. dimming", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1083845854": { "speed": [ { "question": "What speed is the video playing at?\nA. time-lapse\nB. slow motion\nC. normal speed", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "The video is playing at which speed?\nA. slow motion\nB. normal speed\nC. fast-forward", "gt-answer": "C. fast-forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which word describes the speed of the video?\nA. time-lapse\nB. normal\nC. backwards\nD. double", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "At what rate is the video progressing?\nA. slow motion\nB. time-lapse\nC. normal speed", "gt-answer": "B. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "What is the direction in which the clock hands are moving?\nA. counterclockwise\nB. clockwise\nC. stationary", "gt-answer": "B. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the clock hands changing their orientation?\nA. standing still\nB. moving clockwise\nC. moving anti-clockwise", "gt-answer": "B. moving clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In what direction are the clock hands moving?\nA. clockwise\nB. alternating between clockwise and counterclockwise\nC. counterclockwise", "gt-answer": "A. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1083845854_reverse": { "direction": [ { "question": "What is the direction in which the clock hands are moving?\nA. counterclockwise\nB. clockwise\nC. stationary", "gt-answer": "A. counterclockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How are the clock hands changing their orientation?\nA. standing still\nB. moving clockwise\nC. moving anti-clockwise", "gt-answer": "C. moving anti-clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In what direction are the clock hands moving?\nA. clockwise\nB. alternating between clockwise and counterclockwise\nC. counterclockwise", "gt-answer": "C. counterclockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1050618460": { "speed": [ { "question": "What is the speed of the entire video?\nA. normal speed\nB. time-lapse\nC. slow motion", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How would you describe the pace of the entire video?\nA. fast-paced\nB. slow-paced\nC. medium-paced", "gt-answer": "A. fast-paced", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "How does the entire video appear in terms of tempo?\nA. rapidly\nB. moderately\nC. leisurely", "gt-answer": "A. rapidly", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the flowers?\nA. turning into buds\nB. shrinking and wilting\nC. turning into full bloom\nD. remaining as buds", "gt-answer": "C. turning into full bloom", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How do the flowers transform?\nA. from stem to leaf\nB. from full bloom to bud\nC. from seed to germination\nD. from bud to full bloom", "gt-answer": "D. from bud to full bloom", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What happens when the flowers go through the attribute_change?\nA. reaching full maturity\nB. shedding leaves\nC. sprouting more buds\nD. shrinking into buds", "gt-answer": "A. reaching full maturity", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1083113449": { "speed": [ { "question": "What is the speed of the video?\nA. slow motion\nB. time-lapse\nC. normal speed", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What type of speed is applied to the video?\nA. rewind\nB. time-lapse\nC. slow ", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What effect is applied to the video's speed?\nA. time-lapse\nB. normal speed\nC. slow motion", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what way is the speed altered in the video?\nA. normal speed\nB. time-lapse\nC. slow motion", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "How would you describe the change in the sky's appearance?\nA. lightening up\nB. maintaining its brightness\nC. getting darker", "gt-answer": "C. getting darker", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is occurring to the sky?\nA. staying the same\nB. getting darker\nC. brightening", "gt-answer": "B. getting darker", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In terms of illumination, what is happening to the sky?\nA. becoming brighter\nB. growing dimmer\nC. remaining unchanged", "gt-answer": "B. growing dimmer", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1091143117": { "speed": [ { "question": "What is the speed of the video?\nA. time-lapse\nB. slow motion\nC. normal speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following describes the velocity of the video?\nA. fast-forward\nB. regular\nC. backwards", "gt-answer": "B. regular", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which word best captures the pace of the video?\nA. speedy\nB. real-time speed\nC. fast-paced", "gt-answer": "B. real-time speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the eye?\nA. from closed to open\nB. turning red\nC. becoming blurry\nD. from open to closed", "gt-answer": "A. from closed to open", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the eye changing?\nA. changing color\nB. from closed to open\nC. becoming smaller\nD. from open to closed", "gt-answer": "B. from closed to open", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What transformation is occurring in the eye?\nA. from open to closed\nB. shrinking\nC. from closed to open\nD. blinking", "gt-answer": "C. from closed to open", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100329207": { "action": [ { "question": "What is the sheep doing?\nA. running\nB. sleeping\nC. eating grass", "gt-answer": "A. running", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which of the following actions is the sheep engaged in?\nA. swimming\nB. flying\nC. running", "gt-answer": "C. running", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what action can be seen performed by the sheep?\nA. running\nB. knitting\nC. typing on a keyboard", "gt-answer": "A. running", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "From the given information, which action is being exhibited by the sheep?\nA. dancing\nB. running\nC. reading a book", "gt-answer": "B. running", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the activity showcased in the video involving the sheep?\nA. painting\nB. running\nC. playing a musical instrument", "gt-answer": "B. running", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "What is the direction of the camera view?\nA. moving right\nB. moving backward\nC. moving left\nD. moving forward", "gt-answer": "D. moving forward", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "In which direction is the video panning?\nA. up\nB. down\nC. backward\nD. forward", "gt-answer": "D. forward", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the direction of the camera movement?\nA. moving forward\nB. tilting up\nC. tilting down\nD. moving backward", "gt-answer": "A. moving forward", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. fast forward\nB. normal speed\nC. reverse speed\nD. super slow motion", "gt-answer": "B. normal speed", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which option describes the rate at which the video is playing?\nA. accelerated\nB. normal speed\nC. super slow motion\nD. fast-paced", "gt-answer": "B. normal speed", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the tempo of the video?\nA. paused\nB. sped up\nC. slowed down\nD. regular pace", "gt-answer": "D. regular pace", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1089201973": { "action": [ { "question": "What are the people doing in the video?\nA. stopping football\nB. kicking football\nC. throwing football\nD. spinning football", "gt-answer": "B. kicking football", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity are the people engaged in?\nA. stopping football\nB. kicking football\nC. spinning football\nD. throwing football", "gt-answer": "B. kicking football", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action are the people performing?\nA. kicking football\nB. throwing football\nC. spinning football\nD. stopping football", "gt-answer": "A. kicking football", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the movement of the people?\nA. stopping football\nB. kicking football\nC. throwing football\nD. spinning football", "gt-answer": "B. kicking football", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which sport are the people participating in?\nA. kicking football\nB. stopping football\nC. throwing football\nD. spinning football", "gt-answer": "A. kicking football", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. time-lapse\nC. slow motion", "gt-answer": "C. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the pace at which the video is playing?\nA. rapid speed\nB. slow motion\nC. moderate speed", "gt-answer": "B. slow motion", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "At what rate is the video being played?\nA. slow motion\nB. fast speed\nC. regular speed", "gt-answer": "A. slow motion", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What term describes the tempo of the video?\nA. high speed\nB. slow motion\nC. standard speed", "gt-answer": "B. slow motion", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which word best describes the velocity of the video?\nA. regular speed\nB. slow motion\nC. swift speed", "gt-answer": "B. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ], "direction": [ { "question": "What is the direction of the football in the video?\nA. moving from left to right\nB. moving from right to left\nC. stationary", "gt-answer": "A. moving from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the football traveling?\nA. Rightwards\nB. Upwards\nC. Leftwards\nD. Downwards", "gt-answer": "A. Rightwards", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How would you describe the path of the football?\nA. from bottom to top\nB. from right to left\nC. from left to right\nD. from top to bottom", "gt-answer": "C. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1034736653": { "action": [ { "question": "What are the woman athletes doing?\nA. cycling\nB. swimming\nC. running\nD. dancing", "gt-answer": "C. running", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the primary action of the woman athletes?\nA. running\nB. reading\nC. singing\nD. cooking", "gt-answer": "A. running", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity are the woman athletes engaged in?\nA. skiing\nB. running\nC. painting\nD. playing basketball", "gt-answer": "B. running", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What sport are the woman athletes participating in?\nA. running\nB. gardening\nC. knitting\nD. soccer", "gt-answer": "A. running", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which action are the woman athletes performing?\nA. writing\nB. running\nC. driving\nD. shopping", "gt-answer": "B. running", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the woman closest to the camera?\nA. Normal speed\nB. Slowest speed\nC. The fastest speed", "gt-answer": "C. The fastest speed", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Compared to the other people in the video, how fast is the woman closest to the camera moving?\nA. Faster\nB. Same speed\nC. Slower", "gt-answer": "A. Faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Among the individuals in the video, who is moving at the highest speed?\nA. Woman closest to the camera\nB. Man in the background\nC. Other people in the video", "gt-answer": "A. Woman closest to the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In terms of speed, how does the woman closest to the camera rank?\nA. Slowest\nB. Fastest\nC. Middle", "gt-answer": "B. Fastest", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "In which direction are the woman athletes running?\nA. from right to left\nB. in circles\nC. from left to right", "gt-answer": "C. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "From which side are the woman athletes entering the screen?\nA. right\nB. top\nC. left\nD. bottom", "gt-answer": "C. left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way are the woman athletes heading?\nA. from left to right\nB. away from the camera\nC. from right to left\nD. towards the camera", "gt-answer": "A. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1098153561": { "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. time-lapse\nC. slow motion", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How fast is the video playing?\nA. very slow\nB. at a regular pace\nC. in fast forward", "gt-answer": "C. in fast forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following best describes the tempo of the video?\nA. sluggish\nB. steady\nC. accelerated", "gt-answer": "C. accelerated", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what manner is the video playing?\nA. gradually\nB. instantly\nC. quickly", "gt-answer": "C. quickly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the rate at which the video is being played?\nA. rapid\nB. slow-paced\nC. moderate", "gt-answer": "A. rapid", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the leaves?\nA. changing shape\nB. falling off\nC. changing color from green to red\nD. changing color from red to green", "gt-answer": "C. changing color from green to red", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the initial color of the leaves?\nA. red\nB. white\nC. green", "gt-answer": "C. green", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the final color of the leaves?\nA. white\nB. red\nC. green", "gt-answer": "B. red", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1084153195": { "action": [ { "question": "What are the dolphins doing in the water? \nA. Diving\nB. Swimming\nC. Sleeping\nD. Jumping", "gt-answer": "B. Swimming", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which activity can be observed in the dolphins? \nA. Dancing\nB. Swimming\nC. Climbing\nD. Diving", "gt-answer": "B. Swimming", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the action of the dolphins in the video? \nA. Swimming\nB. Jumping\nC. Flying\nD. Reading", "gt-answer": "A. Swimming", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What is the movement of the dolphins?\nA. swimming towards the shore\nB. hovering in one place\nC. swimming away from the shore", "gt-answer": "A. swimming towards the shore", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction are the dolphins swimming?\nA. parallel to the shore\nB. towards the shore\nC. away from the shore", "gt-answer": "B. towards the shore", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "If you observe the dolphins, what direction would you notice them heading?\nA. towards the shore\nB. parallel to the shore\nC. away from the shore", "gt-answer": "A. towards the shore", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the rate of movement in the video?\nA. fast speed\nB. no speed\nC. normal speed\nD. slow speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which word describes the pace of the video?\nA. stationary speed\nB. leisurely speed\nC. moderate speed\nD. rapid speed", "gt-answer": "C. moderate speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What term best describes the velocity of the video?\nA. average speed\nB. low speed\nC. high speed\nD. still speed", "gt-answer": "A. average speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What type of motion does the video exhibit?\nA. standard speed\nB. immobile speed\nC. sluggish speed\nD. swift speed", "gt-answer": "A. standard speed", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the tempo of the video?\nA. rapid speed\nB. unhurried speed\nC. regular speed\nD. static speed", "gt-answer": "C. regular speed", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the sequence of events involving dolphins?\nA. swimming towards the shore, then getting fed with fish\nB. swimming in circles\nC. getting fed with fish, then swimming towards the shore", "gt-answer": "A. swimming towards the shore, then getting fed with fish", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the first event that happens to the dolphins?\nA. Getting fed with fish\nB. None of the above\nC. Swimming towards the shore", "gt-answer": "C. Swimming towards the shore", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the last event in order that happens to the dolphins?\nA. None of the above\nB. Swimming towards the shore\nC. Getting fed with fish", "gt-answer": "C. Getting fed with fish", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1054717541": { "action": [ { "question": "What is the person doing?\nA. cutting dough\nB. kneading dough\nC. grilling dough", "gt-answer": "B. kneading dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action is the person performing?\nA. kneading dough\nB. cutting dough\nC. grilling dough", "gt-answer": "A. kneading dough", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In the video, what is the person engaged in?\nA. grilling dough\nB. kneading dough\nC. cutting dough", "gt-answer": "B. kneading dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity is the person involved in?\nA. kneading dough\nB. grilling dough\nC. cutting dough", "gt-answer": "A. kneading dough", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is demonstrated by the person?\nA. grilling dough\nB. kneading dough\nC. cutting dough", "gt-answer": "B. kneading dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "How is the video playing?\nA. in slow motion\nB. with a time-lapse effect\nC. at normal speed", "gt-answer": "A. in slow motion", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the tempo of the video playback?\nA. medium\nB. slow\nC. fast", "gt-answer": "B. slow", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In what way is the video playing?\nA. rapidly\nB. slowly\nC. consistently", "gt-answer": "B. slowly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the relative speed of the video compared to real-time?\nA. slower\nB. faster\nC. equal", "gt-answer": "A. slower", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1081092839": { "direction": [ { "question": "What is the direction of the sun?\nA. descending\nB. ascending\nC. moving sideways", "gt-answer": "A. descending", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the movement pattern of the sun?\nA. falling\nB. rising\nC. remaining still", "gt-answer": "A. falling", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the movement direction of the sun?\nA. descending\nB. ascending\nC. rotating", "gt-answer": "A. descending", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction does the sun travel during sunset?\nA. downwards\nB. upwards\nC. horizontally", "gt-answer": "A. downwards", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. time-lapse\nB. slow motion\nC. normal speed", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the tempo of the video?\nA. normal speed\nB. slow motion\nC. fast pace", "gt-answer": "C. fast pace", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which speed is the video playing at?\nA. time-lapse\nB. slow motion\nC. regular speed", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the rate of the video?\nA. regular speed\nB. slow motion\nC. time-lapse", "gt-answer": "C. time-lapse", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1059462749": { "action": [ { "question": "Which action is being performed by the person?\nA. reading a book\nB. cooking\nC. climbing down a ladder\nD. riding a bike", "gt-answer": "C. climbing down a ladder", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is taking place with the person?\nA. playing soccer\nB. painting a picture\nC. dancing\nD. climbing down a ladder", "gt-answer": "D. climbing down a ladder", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the main action of the person in the video?\nA. playing basketball\nB. climbing down a ladder\nC. singing\nD. running", "gt-answer": "B. climbing down a ladder", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is being demonstrated by the person?\nA. climbing down a ladder\nB. playing guitar\nC. writing a letter\nD. sleeping", "gt-answer": "A. climbing down a ladder", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "direction": [ { "question": "In which direction is the person moving?\nA. rightwards\nB. downwards\nC. upwards\nD. leftwards", "gt-answer": "B. downwards", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What word describes the movement of the person?\nA. standing\nB. descending\nC. climbing up\nD. jumping", "gt-answer": "B. descending", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "From a higher point to a lower point, the person is:\nA. rotating\nB. rising\nC. staying still\nD. descending", "gt-answer": "D. descending", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. time-lapse\nB. normal speed\nC. slow motion", "gt-answer": "B. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How fast is the video playing?\nA. slowly\nB. quickly\nC. normally", "gt-answer": "C. normally", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the pace of the video?\nA. regular\nB. accelerated\nC. decelerated", "gt-answer": "A. regular", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "At what rate is the video played?\nA. moderate speed\nB. slow speed\nC. fast speed", "gt-answer": "A. moderate speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what tempo is the video running?\nA. high speed\nB. normal speed\nC. low speed", "gt-answer": "B. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077590324": { "action": [ { "question": "What is the woman doing in the video?\nA. doing laundry\nB. cooking\nC. singing", "gt-answer": "A. doing laundry", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in?\nA. dancing\nB. doing laundry\nC. painting", "gt-answer": "B. doing laundry", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action is the woman performing?\nA. swimming\nB. doing laundry\nC. hiking", "gt-answer": "B. doing laundry", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What task is the woman involved in?\nA. knitting\nB. doing laundry\nC. gardening", "gt-answer": "B. doing laundry", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action is depicted in the video?\nA. reading\nB. sleeping\nC. doing laundry", "gt-answer": "C. doing laundry", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the entire video?\nA. slow motion\nB. normal speed\nC. time-lapse", "gt-answer": "B. normal speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the velocity of the video playback?\nA. low speed\nB. normal speed\nC. high speed", "gt-answer": "B. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what fashion is the video being played?\nA. rapid motion\nB. average speed\nC. slow motion", "gt-answer": "B. average speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the order of the events performed by the woman?\nA. Sitting down to operate the washing machine and then putting clothes into the washing machine\nB. Putting clothes into the washing machine and then standing up to operate the washing machine\nC. Operate the washing machine and then putting clothes into the washing machine\nD. Putting clothes into the washing machine and then sitting down to operate the washing machine", "gt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the sequence of actions taken by the woman?\nA. Turning off the washing machine and then getting dressed\nB. Putting clothes into the washing machine and then turning it on\nC. Turning off the washing machine and then putting clothes into it\nD. Getting dressed and then turning on the washing machine", "gt-answer": "B. Putting clothes into the washing machine and then turning it on", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the proper sequence of the woman's actions?\nA. Opening the door of the washing machine and then standing in front of it\nB. Standing in front of the washing machine and then opening the door\nC. Closing the door of the washing machine and then standing in front of it\nD. Standing in front of the washing machine and then closing the door", "gt-answer": "C. Closing the door of the washing machine and then standing in front of it", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1040541401": { "action": [ { "question": "What are the children doing?\nA. painting pictures\nB. reading books\nC. doing chemical experiments\nD. playing soccer", "gt-answer": "C. doing chemical experiments", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activities are the children engaged in?\nA. playing chess\nB. doing chemical experiments\nC. swimming in the pool\nD. dancing ballet", "gt-answer": "B. doing chemical experiments", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action are the children involved in?\nA. building sandcastles\nB. baking cookies\nC. doing chemical experiments\nD. playing hide and seek", "gt-answer": "C. doing chemical experiments", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the main action performed by the children?\nA. doing chemical experiments\nB. flying kites\nC. jumping on the trampoline\nD. riding bicycles", "gt-answer": "A. doing chemical experiments", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which activity are the children participating?\nA. singing in a choir\nB. acting in a play\nC. doing chemical experiments\nD. playing video games", "gt-answer": "C. doing chemical experiments", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. time-lapse\nB. normal speed\nC. super slow motion", "gt-answer": "B. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How fast is the video playing?\nA. normal speed\nB. very slow\nC. extremely fast", "gt-answer": "A. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what pace is the video running?\nA. rapid speed\nB. 10 times slow speed\nC. medium speed", "gt-answer": "C. medium speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059072773": { "attribute_change": [ { "question": "What is happening to the ice cream?\nA. melting\nB. freezing\nC. evaporating\nD. solidifying", "gt-answer": "A. melting", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the ice cream changing?\nA. changing color\nB. being eaten out\nC. turning into liquid\nD. solidifying into a ball", "gt-answer": "C. turning into liquid", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which term best describes the state change of the ice cream?\nA. evaporation\nB. solidifying\nC. melting", "gt-answer": "C. melting", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1064645467": { "action": [ { "question": "What is the man doing?\nA. cooking\nB. reading a book\nC. exercising\nD. watching TV", "gt-answer": "C. exercising", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which activity is the man engaged in?\nA. dancing\nB. doing exercise\nC. swimming\nD. painting", "gt-answer": "B. doing exercise", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In the video, what is the man involved in?\nA. knitting\nB. doing yoga\nC. horseback riding\nD. exercising intensively", "gt-answer": "D. exercising intensively", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What activity is the man participating in?\nA. exercising\nB. playing chess\nC. gardening\nD. business activity", "gt-answer": "A. exercising", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. slow motion\nB. time-lapse\nC. normal speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How fast is the video playing?\nA. normal speed\nB. fast speed\nC. slow speed", "gt-answer": "A. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what pace is the entire video played?\nA. moderately\nB. normally\nC. rapidly", "gt-answer": "B. normally", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which option describes the speed of the video accurately?\nA. slowest speed\nB. fastest speed\nC. normal speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the video playback rate?\nA. accelerated speed\nB. decelerated speed\nC. normal speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the order of events for the man?\nA. jumping up to grab the bar and then putting on his jacket\nB. putting on his jacket and then jumping up to grab the bar\nC. jumping up to grab the bar and then taking off his jacket\nD. taking off his jacket and then jumping up to grab the bar", "gt-answer": "D. taking off his jacket and then jumping up to grab the bar", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "When does the man jump up to grab the bar?\nA. before taking off his jacket\nB. after taking off his jacket\nC. while taking off his jacket", "gt-answer": "B. after taking off his jacket", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the man perform the actions?\nA. he jumps up to grab the bar and then takes off his jacket\nB. he jumps up to grab the bar and then takes off his jacket with his hands\nC. he takes off his jacket and then jumps up to grab the bar with his hands", "gt-answer": "C. he takes off his jacket and then jumps up to grab the bar with his hands", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1088279109": { "direction": [ { "question": "What is the elevator doing?\nA. rising\nB. going down\nC. staying still", "gt-answer": "A. rising", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the elevator moving?\nA. up\nB. down\nC. not moving", "gt-answer": "A. up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the direction of the elevator's movement?\nA. descending\nB. ascending\nC. stationary", "gt-answer": "B. ascending", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which way is the elevator going?\nA. up\nB. down\nC. stopped", "gt-answer": "A. up", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the video?\nA. slow motion\nB. time-lapse\nC. normal speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which mode is the video being played?\nA. normal speed\nB. fast forward\nC. rewind\nD. pause", "gt-answer": "A. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the tempo of the video?\nA. normal speed\nB. slow tempo\nC. no tempo\nD. fast tempo", "gt-answer": "A. normal speed", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1093573255": { "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. slow motion\nC. time-lapse", "gt-answer": "C. time-lapse", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "At what pace is the video running?\nA. steadily\nB. sluggishly\nC. rapidly", "gt-answer": "C. rapidly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "The video is played at what kind of speed?\nA. regular speed\nB. timelapse\nC. decelerated motion", "gt-answer": "B. timelapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the plant?\nA. wilting\nB. reviving\nC. shedding leaves\nD. turning into buds", "gt-answer": "B. reviving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the plant changing?\nA. withering away\nB. turning yellow\nC. reviving\nD. blooming", "gt-answer": "C. reviving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what way is the plant transforming?\nA. wilting\nB. rotting\nC. reviving\nD. shedding leaves", "gt-answer": "C. reviving", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1105233293": { "action": [ { "question": "What are the people doing in the video?\nA. swimming\nB. dancing\nC. playing basketball", "gt-answer": "C. playing basketball", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity are the people engaged in?\nA. playing basketball\nB. sleeping\nC. eating", "gt-answer": "A. playing basketball", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which sport are the people participating in?\nA. playing basketball\nB. soccer\nC. tennis", "gt-answer": "A. playing basketball", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the action of the people in the footage?\nA. playing basketball\nB. reading\nC. writing", "gt-answer": "A. playing basketball", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In the video, what are the people actively involved in?\nA. painting\nB. shopping\nC. playing basketball", "gt-answer": "C. playing basketball", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "speed": [ { "question": "How would you describe the pace of the video?\nA. accelerated speed\nB. normal speed\nC. reversed speed\nD. slow-motion", "gt-answer": "B. normal speed", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the tempo of the video playback?\nA. normal speed\nB. freeze frame\nC. time-lapse\nD. fast-forward", "gt-answer": "A. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which option best characterizes the speed of the entire video?\nA. decelerated motion\nB. quickened pace\nC. normal speed\nD. real-time speed", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the velocity at which the video is playing?\nA. rapid speed\nB. slow motion\nC. stopped frame\nD. normal speed", "gt-answer": "D. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the rate at which the video is progressing?\nA. slo-mo\nB. normal speed\nC. expedited speed\nD. rewinding speed", "gt-answer": "B. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the order of events in the video?\nA. Shooting the basketball and then passing the ball to each other\nB. Shooting the basketball and then dribbling the ball\nC. Passing the ball to each other and then shooting the basketball", "gt-answer": "C. Passing the ball to each other and then shooting the basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the sequence of actions performed by the players?\nA. Shooting the basketball and then passing the ball to each other\nB. Shooting the basketball and then blocking the opponent\nC. Passing the ball to each other and then shooting the basketball", "gt-answer": "C. Passing the ball to each other and then shooting the basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Arrange the events involving the players in the correct order.\nA. dribbling, shooting, passing the basketball\nB. shooting the basketball, passing the ball to each other\nC. passing the ball to each other, shooting the basketball", "gt-answer": "C. passing the ball to each other, shooting the basketball", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077146132": { "action": [ { "question": "What is the woman doing in the video?\nA. waking up\nB. tossing and turning in the bed\nC. falling asleep", "gt-answer": "A. waking up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is the woman performing?\nA. waking up\nB. tossing and turning in the bed\nC. falling asleep", "gt-answer": "A. waking up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the woman engaged in?\nA. tossing and turning in the bed\nB. waking up\nC. falling asleep", "gt-answer": "B. waking up", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what is the woman's activity?\nA. waking up\nB. tossing and turning in the bed\nC. falling asleep", "gt-answer": "A. waking up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is depicted in the video?\nA. falling asleep\nB. waking up\nC. tossing and turning in the bed", "gt-answer": "B. waking up", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the first event in the sequence?\nA. Getting out of bed\nB. Opening the curtains\nC. Both events happen simultaneously", "gt-answer": "A. Getting out of bed", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which event occurs after getting out of bed?\nA. Opening the curtains\nB. Closing the curtains\nC. None of the above", "gt-answer": "A. Opening the curtains", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the last event to occur?\nA. Opening the curtains\nB. None of the above\nC. Getting out of bed", "gt-answer": "A. Opening the curtains", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the video?\nA. staying the same brightness\nB. turning darker\nC. turning brighter", "gt-answer": "C. turning brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the video change in terms of brightness?\nA. decreasing\nB. remaining constant\nC. increasing", "gt-answer": "C. increasing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is occurring with the video's attribute?\nA. maintaining steady brightness\nB. getting brighter\nC. getting dimmer", "gt-answer": "B. getting brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086688682": { "attribute_change": [ { "question": "What change is happening to the traffic lights?\nA. From red to green\nB. From red to yellow\nC. From yellow to red\nD. From green to red", "gt-answer": "A. From red to green", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the attribute change occurring to the traffic lights?\nA. Changing color sequence\nB. Dimming brightness\nC. Switching off\nD. Blinking rapidly", "gt-answer": "A. Changing color sequence", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What alteration is taking place to the traffic lights?\nA. Transitioning from yellow to green\nB. Transitioning from green to yellow\nC. Transitioning from red to green\nD. Transitioning from green to red", "gt-answer": "C. Transitioning from red to green", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1096612823": { "action": [ { "question": "In the video, what can be observed about the car's movement?\nA. sliding on ice\nB. dancing on the rooftop\nC. buried in the sand\nD. driving on the road", "gt-answer": "D. driving on the road", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is happening to the car?\nA. driving on the road\nB. being fixed\nC. sleeping", "gt-answer": "A. driving on the road", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the car doing in the scene?\nA. flying in the sky\nB. swimming in the ocean\nC. parked on the sidewalk\nD. driving on the road", "gt-answer": "D. driving on the road", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What is happening to the video?\nA. zooming out\nB. rotating\nC. panning left\nD. zooming in", "gt-answer": "D. zooming in", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of the video?\nA. panning left\nB. fading out\nC. zooming in\nD. moving backward", "gt-answer": "C. zooming in", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the video changing?\nA. panning upwards\nB. rewinding\nC. zooming out\nD. zooming in", "gt-answer": "D. zooming in", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1075484900": { "direction": [ { "question": "Which way is the child facing in relation to the man?\nA. Forward\nB. Turning towards the man\nC. Turning away from the man\nD. Backward", "gt-answer": "C. Turning away from the man", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction is the child moving in relation to the man?\nA. Backward\nB. Forward\nC. Turning away from the man\nD. Turning towards the man", "gt-answer": "C. Turning away from the man", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the orientation of the child with respect to the man?\nA. Downwards\nB. Upwards\nC. Turning away from the man\nD. Turning towards the man", "gt-answer": "C. Turning away from the man", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1090578917": { "action": [ { "question": "What is the man doing?\nA. playing soccer\nB. painting a picture\nC. reading a book\nD. cooking dinner", "gt-answer": "A. playing soccer", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity is the man engaged in?\nA. playing soccer\nB. dancing\nC. singing\nD. swimming", "gt-answer": "A. playing soccer", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What sport is the man participating in?\nA. volleyball\nB. basketball\nC. soccer\nD. tennis", "gt-answer": "C. soccer", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What recreational activity is the man involved in?\nA. playing chess\nB. gardening\nC. hiking\nD. playing soccer", "gt-answer": "D. playing soccer", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "In what physical activity is the man actively involved?\nA. playing soccer\nB. weightlifting\nC. biking\nD. jogging", "gt-answer": "A. playing soccer", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events in the video?\nA. The man is not leaping to his right nor standing up\nB. The man is standing up and then leaping to his right\nC. The man is leaping to his right and then standing up", "gt-answer": "C. The man is leaping to his right and then standing up", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. The man is standing up from ground\nB. The man is leaping to his right\nC. Nothing is happening", "gt-answer": "B. The man is leaping to his right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening second in the video?\nA. There is no specific order\nB. The man is standing up from ground\nC. The man is leaping to his right", "gt-answer": "B. The man is standing up from ground", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What direction is the man leaping?\nA. to his left\nB. backward\nC. forward\nD. to his right", "gt-answer": "D. to his right", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which way is the man moving?\nA. left\nB. forwards\nC. right\nD. up", "gt-answer": "C. right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of the man's movement?\nA. counterclockwise\nB. horizontal\nC. vertically\nD. clockwise", "gt-answer": "B. horizontal", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1075338140": { "direction": [ { "question": "What is the direction of the ball?\nA. forward and backward\nB. spinning in place\nC. rolling from left to right\nD. rolling from right to left", "gt-answer": "C. rolling from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the ball moving?\nA. counterclockwise\nB. rolling from left to right\nC. clockwise\nD. rolling from right to left", "gt-answer": "B. rolling from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction does the ball travel?\nA. straight ahead\nB. rolling from left to right\nC. rolling from right to left\nD. floating in mid-air", "gt-answer": "B. rolling from left to right", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1067268403": { "direction": [ { "question": "What is the movement direction of the wind turbines?\nA. Stationary\nB. Rotating clockwise\nC. Rotating counterclockwise", "gt-answer": "B. Rotating clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which way are the wind turbines rotating?\nA. Randomly\nB. Clockwise\nC. Anti-clockwise", "gt-answer": "B. Clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In which direction are the wind turbines turning?\nA. Anticlockwise\nB. Still\nC. Clockwise", "gt-answer": "C. Clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the rotational direction of the wind turbines?\nA. Clockwise\nB. Anti-clockwise\nC. Unchanging", "gt-answer": "A. Clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1072594556": { "speed": [ { "question": "How would you describe the speed of the car in the center of the screen?\nA. slower than other cars\nB. faster than other cars\nC. at the same speed as other cars", "gt-answer": "B. faster than other cars", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Compared to other cars, how does the car in the center of the screen move?\nA. At the same speed\nB. Faster\nC. Slower\nD. Information unavailable", "gt-answer": "B. Faster", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What do we know about the car's motion relative to other objects on the screen?\nA. It is the fastest\nB. It is the slowest\nC. There is no motion\nD. Same speed as the others", "gt-answer": "A. It is the fastest", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1096007487": { "direction": [ { "question": "From the camera's point of view, in which direction is the 3d cloud moving?\nA. upward\nB. downward\nC. leftward\nD. rightward", "gt-answer": "C. leftward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the 3d cloud moving from the camera's point of view?\nA. contracting\nB. spinning leftward\nC. spinning rightward\nD. expanding", "gt-answer": "B. spinning leftward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement pattern of the 3d cloud as seen from the camera's point of view?\nA. from right to left\nB. rotating clockwise\nC. rotating counter-clockwise\nD. from left to right", "gt-answer": "A. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1095939659": { "direction": [ { "question": "In which direction is the light growing?\nA. Downwards\nB. Clockwise\nC. Counterclockwise\nD. Upwards", "gt-answer": "B. Clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the direction of the light's movement?\nA. Clockwise\nB. Anticlockwise\nC. Straight forward\nD. Downwards", "gt-answer": "A. Clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the light changing direction?\nA. Spinning vertically\nB. Rotating clockwise\nC. Shifting diagonally\nD. Growing counterclockwise", "gt-answer": "B. Rotating clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059632327": { "direction": [ { "question": "What is the direction of the tennis ball?\nA. bouncing up and down\nB. spinning clockwise and anticlockwise\nC. rolling forward and backward\nD. bouncing left to right", "gt-answer": "A. bouncing up and down", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which direction does the tennis ball move in?\nA. moving in a circular path\nB. floating in mid-air\nC. moving in a zigzag pattern\nD. bouncing up and down", "gt-answer": "D. bouncing up and down", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction does the tennis ball travel?\nA. bouncing up and down\nB. shooting straight ahead\nC. staying stationary\nD. bouncing side to side", "gt-answer": "A. bouncing up and down", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1098785169": { "direction": [ { "question": "What is the direction of the galaxy's spin?\nA. counterclockwise\nB. left to right\nC. clockwise\nD. up and down", "gt-answer": "C. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the galaxy rotating?\nA. backward\nB. counter clockwise\nC. clockwise\nD. forward", "gt-answer": "C. clockwise", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "How is the galaxy spinning?\nA. backward\nB. counter clockwise\nC. clockwise\nD. forward", "gt-answer": "C. clockwise", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1099984801": { "direction": [ { "question": "What is the movement of the clouds?\nA. moving away from the camera\nB. staying still\nC. moving towards the camera", "gt-answer": "C. moving towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction are the clouds heading?\nA. towards the camera\nB. upward\nC. downward\nD. away from the camera", "gt-answer": "A. towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the movement direction of the clouds?\nA. forward\nB. in a circular motion\nC. side to side\nD. backward", "gt-answer": "D. backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. slow motion\nC. time-lapse", "gt-answer": "C. time-lapse", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What speed is the video set to?\nA. time-lapse\nB. time dilation\nC. real-time", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the pacing of the video?\nA. accelerating\nB. decelerating\nC. normal speed", "gt-answer": "A. accelerating", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the entire video?\nA. staying the same\nB. getting darker\nC. getting brighter", "gt-answer": "B. getting darker", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What change is occurring to the light condition of the video?\nA. getting darker\nB. remaining stable\nC. getting brighter", "gt-answer": "A. getting darker", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following best describes the change in the entire video?\nA. getting darker\nB. getting blurry\nC. turning brighter", "gt-answer": "A. getting darker", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1082419672": { "direction": [ { "question": "What is the direction of movement in the video?\nA. hovering\nB. flying forwards\nC. flying backwards", "gt-answer": "C. flying backwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the trajectory of the movement?\nA. straight line\nB. arc-shaped\nC. zigzag", "gt-answer": "A. straight line", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In what direction is the entire video moving relative to the ship?\nA. forward\nB. up\nC. down\nD. backward", "gt-answer": "D. backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1058985719": { "direction": [ { "question": "What is the direction in which the airplane is flying?\nA. bottom to top\nB. right to left\nC. top to bottom\nD. left to right", "gt-answer": "A. bottom to top", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which way is the airplane moving on the screen?\nA. anticlockwise\nB. upwards\nC. clockwise\nD. downwards", "gt-answer": "B. upwards", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the trajectory of the airplane?\nA. vertically upwards\nB. vertically downwards\nC. horizontally rightwards\nD. horizontally leftwards", "gt-answer": "A. vertically upwards", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1055413730": { "direction": [ { "question": "In which direction is the planet Earth spinning?\nA. Rightwards\nB. Downwards\nC. Leftwards\nD. Upwards", "gt-answer": "A. Rightwards", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Considering the camera's perspective, what is the rotational movement of the planet Earth?\nA. spinning to the left\nB. rotating upward\nC. spinning to the right", "gt-answer": "C. spinning to the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the apparent motion of the Earth based on the camera's viewpoint?\nA. away from the camera\nB. towards the camera\nC. spinning to the right\nD. spinning to the left", "gt-answer": "C. spinning to the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1081684532": { "direction": [ { "question": "What is the direction of the asteroids in the video?\nA. flying away from the camera\nB. flying to the left\nC. flying towards the camera\nD. flying to the right", "gt-answer": "C. flying towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction are the asteroids moving?\nA. downwards\nB. towards the camera\nC. upwards\nD. away from the camera", "gt-answer": "B. towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way are the asteroids going?\nA. towards the camera\nB. parallel to the camera\nC. away from the camera", "gt-answer": "A. towards the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "23391142": { "action": [ { "question": "What are the people doing in the video?\nA. dancing\nB. playing badminton\nC. reading books", "gt-answer": "B. playing badminton", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity are the people engaged in?\nA. swimming\nB. playing badminton\nC. playing soccer", "gt-answer": "B. playing badminton", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which of the following activities are the people participating in?\nA. playing badminton\nB. hiking\nC. baking cookies", "gt-answer": "A. playing badminton", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action can be seen in the video?\nA. knitting\nB. playing badminton\nC. painting", "gt-answer": "B. playing badminton", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is happening in the video?\nA. sleeping\nB. singing\nC. playing badminton", "gt-answer": "C. playing badminton", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What direction is the video panning?\nA. Upwards\nB. Downwards\nC. To the left\nD. To the right", "gt-answer": "D. To the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement of the video?\nA. Zoom in\nB. Panning to the left\nC. Zoom out\nD. Panning to the right", "gt-answer": "D. Panning to the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the scene shifting?\nA. Panning to the left\nB. Panning to the right\nC. Away from the camera\nD. Towards the camera", "gt-answer": "B. Panning to the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. slow motion\nC. time-lapse", "gt-answer": "B. slow motion", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How fast is the video playing?\nA. quickly\nB. at a moderate pace\nC. slowly", "gt-answer": "C. slowly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which speed mode is applied to the video?\nA. regular speed\nB. accelerated\nC. slow motion", "gt-answer": "C. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the video playback rate?\nA. fast\nB. slow\nC. moderate", "gt-answer": "B. slow", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what kind of speed is the video shown?\nA. slow motion\nB. rapid\nC. normal", "gt-answer": "A. slow motion", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1078368947": { "action": [ { "question": "What is the woman doing in the bathroom?\nA. reading a book while taking a shower\nB. writing letter while taking a bath\nC. reading a book while taking a bath", "gt-answer": "C. reading a book while taking a bath", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity is the woman engaged in?\nA. reading a book while taking a bath\nB. listening to music while taking a bath\nC. drinking wine while taking a bath", "gt-answer": "A. reading a book while taking a bath", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the woman involved in?\nA. washing her hair while taking a bath\nB. reading a book while taking a bath\nC. washing her face while taking a bath", "gt-answer": "B. reading a book while taking a bath", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1099738787": { "attribute_change": [ { "question": "What is happening to the concrete wall?\nA. melting\nB. falling apart\nC. assembling together", "gt-answer": "B. falling apart", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the attribute change of the concrete wall?\nA. rebuilding\nB. shrinking\nC. disappearing\nD. falling apart", "gt-answer": "D. falling apart", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "In what state is the concrete wall?\nA. expanding\nB. assembling together\nC. falling apart\nD. intact", "gt-answer": "C. falling apart", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1094219575": { "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. time-lapse\nC. slow motion\nD. fast forwarding", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which term describes how the video is played?\nA. time-lapse\nB. rewinded\nC. decelerated\nD. paused", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the video being played?\nA. as a time-lapse\nB. on fast forward\nC. in slow motion\nD. at a regular pace", "gt-answer": "A. as a time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What type of speed is applied to the video?\nA. gradual speed\nB. erratic speed\nC. time-lapse speed\nD. variable speed", "gt-answer": "C. time-lapse speed", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In what way is the video being shown?\nA. rapidly\nB. in real-time\nC. as a time-lapse\nD. in slow motion", "gt-answer": "C. as a time-lapse", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the flowers?\nA. growing taller\nB. changing color\nC. blooming\nD. wilting", "gt-answer": "D. wilting", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the condition of the flowers?\nA. decaying\nB. dormant\nC. budding\nD. blooming", "gt-answer": "A. decaying", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the transformation occurring to the flowers?\nA. reproducing through seeds\nB. changing from withered to full blossom\nC. changing from full blossom to withered\nD. sprouting new buds", "gt-answer": "C. changing from full blossom to withered", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1053758117": { "direction": [ { "question": "What is happening in the video?\nA. Zoom out from a 3D digital brain\nB. Standing still before a 3D digital brain\nC. Zoom into a 3D digital brain", "gt-answer": "C. Zoom into a 3D digital brain", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the camera moving in the video?\nA. zooming in\nB. downwards\nC. upwards\nD. zooming out", "gt-answer": "A. zooming in", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How would you describe the trajectory of the video's direction?\nA. panning right\nB. panning left\nC. zooming out\nD. zooming in", "gt-answer": "D. zooming in", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1069717165": { "order": [ { "question": "How does the woman arrange her head movements?\nA. nodding and shaking her head repeatedly\nB. shaking her head, followed by nodding her head\nC. nodding her head, followed by shaking her head", "gt-answer": "B. shaking her head, followed by nodding her head", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What does the woman do after shaking her heads?\nA. feeling sad\nB. nothing\nC. nodding her head\nD. left away", "gt-answer": "C. nodding her head", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which actions did the woman take and in what order?\nA. shaking her head and then shaking it again\nB. nodding her head and then nodding it again\nC. nodding her head and then shaking her head\nD. shaking her whole body and then turning around", "gt-answer": "A. shaking her head and then shaking it again", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1041584314": { "order": [ { "question": "In what order does the man's expression change?\nA. The man doesn't change his expression\nB. Smiling, then showing a serious expression\nC. Showing a serious expression, then smiling", "gt-answer": "C. Showing a serious expression, then smiling", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "When does the man start to smile?\nA. After showing a serious expression\nB. Before showing a serious expression\nC. The man doesn't smile", "gt-answer": "A. After showing a serious expression", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How did the man's facial expressions change over time?\nA. from serious to smiling\nB. no change in expressions\nC. from smiling to serious", "gt-answer": "A. from serious to smiling", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1067427023": { "speed": [ { "question": "What is the speed of the video?\nA. normal speed\nB. time-lapse\nC. slow motion", "gt-answer": "B. time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How fast is the video playing?\nA. time-lapse\nB. normal speed\nC. slow motion", "gt-answer": "A. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what manner is the video progressing?\nA. real-time\nB. slow motion\nC. sped up", "gt-answer": "C. sped up", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Which term best describes the transformation happening to the snow particles?\nA. solidifying\nB. melting\nC. scattering", "gt-answer": "B. melting", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What change is occurring to the snow particles?\nA. remaining the same\nB. growing in size\nC. decreasing in size", "gt-answer": "C. decreasing in size", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In the given scenario, what is the primary attribute change experienced by the snow particles?\nA. freezing\nB. melting\nC. scattering", "gt-answer": "B. melting", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1093948229": { "attribute_change": [ { "question": "What is happening to the golden particles?\nA. melting\nB. shrinking\nC. spinning\nD. exploding", "gt-answer": "D. exploding", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following best describes the change in the attribute of the golden particles?\nA. freezing\nB. exploding\nC. melting\nD. shrinking", "gt-answer": "B. exploding", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which word below represents the transformation taking place on the golden particles?\nA. contracting\nB. melting\nC. exploding\nD. condensing", "gt-answer": "C. exploding", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1106668103": { "direction": [ { "question": "What is the direction of movement in the video?\nA. staying still\nB. moving forward\nC. moving backward", "gt-answer": "B. moving forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what way is the primary motion depicted in the video?\nA. turning leftward\nB. moving forward\nC. moving backward\nD. turning rightward", "gt-answer": "B. moving forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the primary trajectory in the video?\nA. descending\nB. moving backward\nC. moving forward", "gt-answer": "C. moving forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1049965795": { "attribute_change": [ { "question": "What is happening to the light bulb?\nA. turning off\nB. breaking\nC. light up\nD. rapidly changing color", "gt-answer": "C. light up", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What change occurs in the light bulb?\nA. becoming darker\nB. getting smaller\nC. light up\nD. flickering", "gt-answer": "C. light up", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What alteration takes place in the light bulb?\nA. rusting\nB. turn off\nC. crackling\nD. light up", "gt-answer": "D. light up", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1052364490": { "attribute_change": [ { "question": "What is happening to the digital bar chart?\nA. staying in the same size\nB. increasing\nC. decreasing", "gt-answer": "B. increasing", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "The digital bar chart is experiencing what kind of change?\nA. decreasing\nB. growing\nC. fluctuating", "gt-answer": "B. growing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What alteration is taking place to the digital bar chart?\nA. levelling out\nB. growing\nC. disappearing", "gt-answer": "B. growing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1080990179": { "attribute_change": [ { "question": "What is happening to the apple?\nA. being cut\nB. shrinking and drying out\nC. growing bigger", "gt-answer": "B. shrinking and drying out", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the apple changing?\nA. getting smaller\nB. remaining in the same shape\nC. getting bigger", "gt-answer": "A. getting smaller", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the change in the apple's attributes?\nA. swelling and becoming juicy\nB. shrinking and drying out\nC. being cut and getting smaller", "gt-answer": "B. shrinking and drying out", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1057163434": { "direction": [ { "question": "What is the chef doing with the bread?\nA. removing it from the top of the burger\nB. putting it on top of the burger\nC. putting it inside the burger\nD. throwing it away", "gt-answer": "B. putting it on top of the burger", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction is the chef moving the bread?\nA. throwing it away\nB. removing it from the burger\nC. putting it on top of the burger\nD. putting it inside the burger", "gt-answer": "C. putting it on top of the burger", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action is the chef performing with the bread?\nA. putting it on top of the burger\nB. picking it up from the burger\nC. inserting it inside the burger", "gt-answer": "A. putting it on top of the burger", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1085910917": { "action": [ { "question": "What is the woman doing in the video?\nA. drinking\nB. sleeping\nC. dancing", "gt-answer": "A. drinking", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in?\nA. running\nB. drinking\nC. cooking", "gt-answer": "B. drinking", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In the video, what is the action performed by the woman?\nA. reading\nB. swimming\nC. drinking", "gt-answer": "C. drinking", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What behavior is exhibited by the woman?\nA. drinking\nB. eating\nC. talking", "gt-answer": "A. drinking", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is being carried out by the woman?\nA. drawing\nB. drinking\nC. walking", "gt-answer": "B. drinking", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "In what sequence do the events occur in the video?\nA. drinking a glass of water and then turning back\nB. turning back and then drinking a glass of water\nC. both events occur at the same time", "gt-answer": "A. drinking a glass of water and then turning back", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the first event that happened?\nA. turning back\nB. both events occur simultaneously\nC. drinking a glass of water", "gt-answer": "C. drinking a glass of water", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the second event that happened?\nA. drinking a glass of water\nB. both events occur simultaneously\nC. turning back", "gt-answer": "C. turning back", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1058907236": { "action": [ { "question": "What is the squirrel doing in the park?\nA. Sleeping\nB. Swimming\nC. Foraging\nD. Dancing", "gt-answer": "C. Foraging", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the squirrel performing?\nA. Running around\nB. Taking a rest\nC. Foraging for mushroom\nD. Foraging for nuts", "gt-answer": "D. Foraging for nuts", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the main activity of the squirrel?\nA. Building a nest\nB. Foraging for nuts\nC. Hibernating \nD. Jumping", "gt-answer": "B. Foraging for nuts", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the correct order of the events?\nA. Cannot be determined from the given information\nB. Turning back followed by picking up a nut\nC. Picking up a nut followed by turning back", "gt-answer": "C. Picking up a nut followed by turning back", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the first event in the sequence?\nA. Picking up a nut\nB. Turning back\nC. Cannot be determined from the given information", "gt-answer": "A. Picking up a nut", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the second event in the sequence?\nA. Turning back\nB. Cannot be determined from the given information\nC. Picking up a nut", "gt-answer": "A. Turning back", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which event happens before the other?\nA. Turning back\nB. Cannot be determined from the given information\nC. Picking up a nut", "gt-answer": "C. Picking up a nut", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1077575504": { "attribute_change": [ { "question": "What is happening to the pile of salt?\nA. scattering\nB. growing\nC. melting\nD. disappearing", "gt-answer": "B. growing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which one of the following is an attribute change happening to the pile of salt?\nA. shrinking\nB. growing\nC. burning\nD. dissolving", "gt-answer": "B. growing", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "How is the pile of salt changing?\nA. melting\nB. unchanged\nC. growing bigger\nD. becoming smaller", "gt-answer": "C. growing bigger", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "23370985": { "attribute_change": [ { "question": "What is happening to the ice crystal?\nA. freezing\nB. melting\nC. shattering", "gt-answer": "A. freezing", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What process is occurring with the ice crystal?\nA. reducing in size\nB. turning into water\nC. growing in size\nD. remaining the same", "gt-answer": "C. growing in size", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What transformation is taking place in the ice crystal?\nA. cracking\nB. unchanged\nC. melting\nD. forming", "gt-answer": "D. forming", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100319395": { "direction": [ { "question": "What direction is the circular pattern moving?\nA. clockwise\nB. towards the camera\nC. counter-clockwise\nD. away from the camera", "gt-answer": "A. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which way is the circular pattern moving?\nA. spinning clockwise\nB. spinning counter-clockwise\nC. vibrating back and forth", "gt-answer": "A. spinning clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the circular pattern spinning?\nA. towards the screen\nB. anticlockwise\nC. clockwise\nD. away from the screen", "gt-answer": "C. clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1067268406": { "speed": [ { "question": "What is the speed of the car?\nA. at the same speed as the camera\nB. faster than the camera\nC. slower than the camera", "gt-answer": "B. faster than the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the car's speed compare to the camera's speed?\nA. It is faster.\nB. It is slower.\nC. They have the same speed.", "gt-answer": "A. It is faster.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Does the car move at a different speed compared to the camera?\nA. Yes, it moves faster.\nB. Yes, it moves slower.\nC. No, they move at the same speed.", "gt-answer": "A. Yes, it moves faster.", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1092682551": { "speed": [ { "question": "What is the speed of the cars compared to the camera?\nA. travel at the same speed as the camera\nB. faster than the camera\nC. travel slower than the camera", "gt-answer": "C. travel slower than the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the cars' speed compare to the camera's speed?\nA. They have the same speed.\nB. They are slower.\nC. They are faster.", "gt-answer": "B. They are slower.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Do the cars move at a different speed compared to the camera?\nA. Yes, they move faster.\nB. No, they move at the same speed.\nC. Yes, they move slower.", "gt-answer": "C. Yes, they move slower.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1101200293": { "direction": [ { "question": "What is the direction of the camera motion relative to the aircraft carrier?\nA. counterclockwise\nB. downward\nC. upward\nD. clockwise", "gt-answer": "D. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the camera moving around the aircraft carrier?\nA. clockwise\nB. back and forth\nC. tilting upwards\nD. counterclockwise", "gt-answer": "A. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction is the camera flying around the aircraft carrier?\nA. clockwise\nB. descending\nC. ascending\nD. anti-clockwise", "gt-answer": "A. clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1072453637": { "direction": [ { "question": "What is the direction of the camera panning in the video?\nA. panning to the back of a fighter jet\nB. panning downwards around a fighter jet\nC. panning upwards around a fighter jet\nD. panning to the front of a fighter jet", "gt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the camera's panning orientation in the video?\nA. Moving to the front of a fighter jet\nB. Ascending around a fighter jet\nC. Moving to the rear of a fighter jet\nD. Descending around a fighter jet", "gt-answer": "C. Moving to the rear of a fighter jet", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Identify the camera's panning movement in the video.\nA. Panning to the back of a fighter jet\nB. Panning upward around a fighter jet\nC. Panning downward around a fighter jet\nD. Panning to the front of a fighter jet", "gt-answer": "A. Panning to the back of a fighter jet", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "What was the order of events for the fighter jet in the video?\nA. shooting three missiles, then shooting four missiles\nB. shooting two missiles, then shooting one missile\nC. shooting one missile, then shooting two missiles\nD. shooting four missiles, then shooting three missiles", "gt-answer": "C. shooting one missile, then shooting two missiles", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What did the fighter jet do first in the video?\nA. shooting two missiles\nB. shooting one missile\nC. shooting three missiles\nD. shooting four missiles", "gt-answer": "B. shooting one missile", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What did the fighter jet do latter in the video?\nA. shooting three missiles\nB. shooting two missiles\nC. shooting one missile\nD. shooting four missiles", "gt-answer": "B. shooting two missiles", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3396473605": { "direction": [ { "question": "In which direction do the five stars appear?\nA. from right to left\nB. from top to bottom\nC. from left to right\nD. from bottom to top", "gt-answer": "C. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which star appears first?\nA. the star in the center\nB. the star in the right\nC. the star in the left\nD. all stars appear at the same time", "gt-answer": "C. the star in the left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction that the stars appear?\nA. from right to left\nB. from left to right\nC. upwards\nD. downwards", "gt-answer": "B. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086820415": { "direction": [ { "question": "What is the direction of motion of the large wave?\nA. moving vertically towards the top of the screen\nB. moving horizontally towards the right side of the screen\nC. moving vertically towards the bottom of the screen\nD. moving horizontally towards the left side of the screen", "gt-answer": "C. moving vertically towards the bottom of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction does the large wave move in the video?\nA. vertically towards the top of the screen\nB. diagonally towards the bottom-right corner\nC. vertically towards the bottom of the screen\nD. diagonally towards the top-left corner", "gt-answer": "C. vertically towards the bottom of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the large wave travel across the screen?\nA. moving vertically towards the bottom\nB. contracting towards the center\nC. moving vertically towards the top\nD. expanding from the center", "gt-answer": "A. moving vertically towards the bottom", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1081513610": { "action": [ { "question": "What is the man doing in the video?\nA. swimming\nB. discussing\nC. sleeping\nD. running", "gt-answer": "B. discussing", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What action is the man performing?\nA. discussing\nB. reading\nC. cooking\nD. dancing", "gt-answer": "A. discussing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which activity is the man engaged in?\nA. singing\nB. playing basketball\nC. discussing\nD. painting", "gt-answer": "C. discussing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the man occupied with?\nA. discussing\nB. shopping\nC. working out\nD. gardening", "gt-answer": "A. discussing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What does the man participate in?\nA. biking\nB. hiking\nC. fishing\nD. discussing", "gt-answer": "D. discussing", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1073831006": { "action": [ { "question": "What are the zebras doing in the video?\nA. swimming\nB. sleeping\nC. running", "gt-answer": "C. running", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which of the following actions are the zebras performing?\nA. running\nB. jumping\nC. eating", "gt-answer": "A. running", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In the video, what can we see the zebras doing?\nA. running\nB. standing still\nC. drinking water", "gt-answer": "A. running", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What is the direction of the zebras' movement?\nA. from right to left\nB. from left to right\nC. from top to bottom", "gt-answer": "B. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction are the zebras moving?\nA. from left to right relative to the camera\nB. away from the camera\nC. towards the camera\nD. from right to left relative to the camera", "gt-answer": "A. from left to right relative to the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which direction are the zebras heading?\nA. downward\nB. leftward\nC. rightward\nD. upward", "gt-answer": "C. rightward", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ], "speed": [ { "question": "What is the speed of the zebras in the video?\nA. slow motion\nB. stationary\nC. fast motion\nD. normal speed", "gt-answer": "A. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "How fast is the video playing?\nA. normal speed\nB. time-lapse\nC. slow motion", "gt-answer": "C. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which option describes the rate at which the video is playing?\nA. accelerated\nB. normal speed\nC. slow motion", "gt-answer": "C. slow motion", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1069338034": { "action": [ { "question": "What are the elephants doing in the video?\nA. eating and drinking\nB. sleeping and resting\nC. eating and playing", "gt-answer": "A. eating and drinking", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which action is observed in the video?\nA. swimming and taking bath\nB. swimming and drinking\nC. eating and drinking", "gt-answer": "C. eating and drinking", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity are the elephants engaged in?\nA. swimming and cleaning themselves\nB. eating and drinking\nC. swimming and resting", "gt-answer": "B. eating and drinking", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1076880707": { "action": [ { "question": "What is the bear doing near the tree?\nA. eating honey\nB. climbing a tree\nC. scratching against a tree", "gt-answer": "C. scratching against a tree", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the bear engaged in?\nA. climbing a tree\nB. taking a nap under the tree\nC. scratching against a tree", "gt-answer": "C. scratching against a tree", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action can be seen in the video?\nA. scratching against a tree\nB. sleeping against the tree\nC. eating under the tree", "gt-answer": "A. scratching against a tree", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1092278063": { "direction": [ { "question": "What is the direction of the two rows of duck toy?\nA. moving in opposite directions on a conveyor belt\nB. moving in the same direction on a conveyor belt\nC. not moving on a conveyor belt", "gt-answer": "A. moving in opposite directions on a conveyor belt", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the movement pattern of the two rows of duck toy on a conveyor belt?\nA. circular motion\nB. straight motion\nC. zigzag motion", "gt-answer": "B. straight motion", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction are the two rows of duck toy moving relative to each other?\nA. perpendicular to each other\nB. in opposite directions\nC. in the same direction", "gt-answer": "B. in opposite directions", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "What is the speed of the conveyor belt?\nA. normal speed\nB. stopped\nC. super fast speed\nD. slow speed", "gt-answer": "A. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How fast is the conveyor belt moving?\nA. very slowly\nB. very quickly\nC. at a moderate pace\nD. not moving at all", "gt-answer": "C. at a moderate pace", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the velocity of the conveyor belt?\nA. zero velocity\nB. extreme high velocity\nC. extreme low velocity\nD. moderate velocity", "gt-answer": "D. moderate velocity", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1024867412": { "action": [ { "question": "What is the dog doing in the video?\nA. eating\nB. driving a car\nC. sleeping\nD. barking", "gt-answer": "B. driving a car", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which activity is the dog engaged in?\nA. reading a book\nB. swimming\nC. cooking\nD. driving a car", "gt-answer": "D. driving a car", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What action is the dog performing?\nA. painting\nB. dancing\nC. driving a car\nD. singing", "gt-answer": "C. driving a car", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What can be seen in the video involving the dog?\nA. driving a car\nB. flying a kite\nC. running\nD. playing soccer", "gt-answer": "A. driving a car", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is being carried out by the dog?\nA. building a sandcastle\nB. driving a car\nC. riding a bike\nD. knitting", "gt-answer": "B. driving a car", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What direction is the car driving?\nA. Taking a left turn\nB. Going straight\nC. Taking a right turn\nD. Going backward", "gt-answer": "C. Taking a right turn", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the car moving?\nA. Left\nB. Right\nC. Backward\nD. Forward", "gt-answer": "B. Right", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What maneuver is the car making?\nA. Making a left turn\nB. Parked on the street\nC. Driving backward\nD. Making a right turn", "gt-answer": "D. Making a right turn", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1076877854": { "action": [ { "question": "What are the robots doing in the field?\nA. caring for seedlings\nB. watering plants\nC. harvesting crops\nD. plowing the soil", "gt-answer": "A. caring for seedlings", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which task are the robots performing?\nA. cooking dinner\nB. building houses\nC. caring for seedlings\nD. repairing cars", "gt-answer": "C. caring for seedlings", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action are the robots engaged in?\nA. cleaning tables\nB. caring for seedlings\nC. playing chess\nD. cooking meals", "gt-answer": "B. caring for seedlings", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which direction is the closest robotic arm moving from the camera's point of view?\nA. To the right side of the screen\nB. Towards the camera\nC. Away from the camera\nD. To the left side of the screen", "gt-answer": "A. To the right side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What motion can be observed about the closest robotic arm?\nA. Rotating\nB. Moving to the left side of the screen\nC. Oscillating\nD. Moving to the right side of the screen", "gt-answer": "D. Moving to the right side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What kind of movement does the closest robotic arm exhibit?\nA. Shifting to the left side of the screen\nB. Ascending and descending\nC. Shifting to the right side of the screen\nD. Swaying back and forth", "gt-answer": "C. Shifting to the right side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1104673225": { "action": [ { "question": "What is the woman doing in the video?\nA. wrapping up salad\nB. throwing away salad\nC. eating salad\nD. making salad", "gt-answer": "C. eating salad", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in?\nA. wrapping up salad\nB. eating salad\nC. making salad\nD. drinking vegetable juice", "gt-answer": "B. eating salad", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action is the woman involved in?\nA. drinking vegetable juice\nB. making salad\nC. wrapping up salad\nD. eating salad", "gt-answer": "D. eating salad", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100468035": { "direction": [ { "question": "What is the direction of the camera in the video?\nA. zooming backward\nB. zooming forward\nC. tracking right\nD. panning left", "gt-answer": "B. zooming forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction is the camera moving towards?\nA. zooming backward\nB. ascending upward\nC. sliding left\nD. zooming forward", "gt-answer": "D. zooming forward", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "In what manner is the camera moving?\nA. zooming backward\nB. dollying up\nC. zooming forward\nD. tilting down", "gt-answer": "C. zooming forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the door?\nA. remaining closed\nB. closing\nC. gradually opening", "gt-answer": "C. gradually opening", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the door changing?\nA. by gradually opening\nB. by shrinking\nC. by staying the same\nD. by gradually closing", "gt-answer": "A. by gradually opening", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What option best describes the change of the door?\nA. opening\nB. staying closed\nC. staying half-opened\nD. closing", "gt-answer": "A. opening", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "315784": { "speed": [ { "question": "In relation to the speedometer on the left, how does the speedometer in the center appear?\nA. stationary\nB. moving slower\nC. moving faster", "gt-answer": "C. moving faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the relative speed of the speedometer in the center compared to the speedometer on the left?\nA. slower\nB. equal\nC. faster", "gt-answer": "C. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speedometer in the center differ from the speedometer on the left?\nA. moving at the same speed\nB. moving at a slower speed\nC. moving at a faster speed", "gt-answer": "C. moving at a faster speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3411806181": { "action": [ { "question": "What is the person doing in the video?\nA. recharging an electric vehicle\nB. cleaning an electric vehicle\nC. repairing an electric vehicle", "gt-answer": "A. recharging an electric vehicle", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity is the person engaged in?\nA. repairing an EV\nB. cleaning an EV\nC. recharging an EV", "gt-answer": "C. recharging an EV", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the person involved in?\nA. driving an electric vehicle\nB. fueling a car\nC. recharging an electric vehicle\nD. cleaning an electric vehicle", "gt-answer": "C. recharging an electric vehicle", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Which direction is the person moving the charging gun?\nA. Away from the car\nB. Parallel to the car\nC. Towards the car", "gt-answer": "C. Towards the car", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is the person performing on the charging gun?\nA. holding it still\nB. unpluging it from the car\nC. plugging it into the car", "gt-answer": "C. plugging it into the car", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Towards which side is the person moving the charging gun?\nA. himself\nB. the car\nC. none of both", "gt-answer": "B. the car", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "What is the speed of the video?\nA. time-lapse\nB. slow motion\nC. normal speed", "gt-answer": "B. slow motion", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the pace at which the video is playing?\nA. real-time speed\nB. fast forward\nC. slow motion", "gt-answer": "C. slow motion", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "At what rate is the video being played?\nA. slow motion\nB. time-lapse\nC. normal speed", "gt-answer": "A. slow motion", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1043054206": { "speed": [ { "question": "How would you describe the speed of the yellow car compared to other cars?\nA. Stopped\nB. Driving faster than other cars\nC. Driving at the same speed as other cars\nD. Driving slower than other cars", "gt-answer": "B. Driving faster than other cars", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In relation to other cars, how can you characterize the speed of the yellow car?\nA. Traveling at a slower pace than other cars\nB. Traveling at a faster pace than other cars\nC. Currently not in motion\nD. Traveling at an equivalent speed to other cars", "gt-answer": "B. Traveling at a faster pace than other cars", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "When comparing the yellow car to other vehicles, how would you depict its speed?\nA. Moving more slowly than other cars\nB. Moving faster than other cars\nC. Moving at a comparable speed to other cars\nD. Stationary", "gt-answer": "B. Moving faster than other cars", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1096238125": { "action": [ { "question": "What are the man and woman doing in the video?\nA. doing sit-ups\nB. jumping rope\nC. lifting weights\nD. doing push-ups", "gt-answer": "C. lifting weights", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "How would you describe the action performed by the man and woman?\nA. doing push-ups\nB. lifting kettlebell\nC. running\nD. jumping rope", "gt-answer": "B. lifting kettlebell", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which activity are the man and woman engaged in?\nA. playing tennis\nB. doing bench press\nC. lifting kettlebell\nD. doing push-ups", "gt-answer": "C. lifting kettlebell", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "speed": [ { "question": "How is the man lifting the kettlebell compared to the woman?\nA. At roughly the same speed as the woman\nB. Slower\nC. Faster", "gt-answer": "A. At roughly the same speed as the woman", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In terms of speed, how does the man compare to the woman while lifting the kettlebell?\nA. Significantly faster\nB. Significantly slower\nC. Approximately the same", "gt-answer": "C. Approximately the same", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the speed of the man relative to the woman while lifting the kettlebell?\nA. same speed\nB. much faster\nC. much slower", "gt-answer": "A. same speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1103088481": { "action": [ { "question": "What is the person doing in the market?\nA. selling vegetables\nB. packaging vegetables\nC. cooking vegetables\nD. buying vegetables", "gt-answer": "D. buying vegetables", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What activity is the person engaged in at the grocery store?\nA. packaging vegetables\nB. cooking vegetables\nC. selling vegetables\nD. buying vegetables", "gt-answer": "D. buying vegetables", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the individual doing in the video?\nA. buying vegetables\nB. eating vegetables\nC. packaging vegetables\nD. selling vegetables", "gt-answer": "A. buying vegetables", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the correct order of events in the video?\nA. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley\nB. Placing a black vegetables into the trolley and then placing a green vegetables into the trolley\nC. Placing a green vegetables into the trolley, followed by placing a yellow vegetables into the trolley\nD. Placing a red vegetables into the trolley, followed by placing a green vegetables into the trolley", "gt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what sequence are the vegetables being placed in the trolley?\nA. Only a black vegetables\nB. First, a black vegetables and then a green vegetables\nC. First, a green vegetables and then a black vegetables\nD. Only a green vegetables", "gt-answer": "C. First, a green vegetables and then a black vegetables", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action comes second in the video?\nA. Removing a black vegetables from the trolley\nB. Removing a green vegetables from the trolley\nC. Placing a green vegetables into the trolley\nD. Placing a black vegetables into the trolley", "gt-answer": "D. Placing a black vegetables into the trolley", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055981522": { "attribute_change": [ { "question": "What is happening to the 3d shapes?\nA. disappearing\nB. turning into triangles\nC. turning into spheres\nD. turning into cubes", "gt-answer": "C. turning into spheres", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the attribute change of the 3d shapes?\nA. transforming from cubes into spheres\nB. transforming from spheres into cubes\nC. remaining as cubes\nD. remaining as spheres", "gt-answer": "A. transforming from cubes into spheres", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which shape are the 3d shapes transforming into?\nA. cubes\nB. triangles\nC. spheres\nD. pentagons", "gt-answer": "C. spheres", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1061017846": { "speed": [ { "question": "What is the speed of the boat on the top of the screen?\nA. slower than the boat on the bottom of the screen\nB. faster than the boat on the bottom of the screen\nC. travels at the same speed as the boat on the bottom of the screen", "gt-answer": "C. travels at the same speed as the boat on the bottom of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Is the boat on the top of the screen moving at a different speed compared to the boat on the bottom of the screen?\nA. no, it's moving at the same speed\nB. yes, it's moving faster\nC. yes, it's moving slower", "gt-answer": "A. no, it's moving at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How would you describe the speed of the boat on the top of the screen compared to the boat on the bottom of the screen?\nA. equal speed\nB. significantly faster\nC. slightly faster", "gt-answer": "A. equal speed", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1097341567": { "order": [ { "question": "In what order do the events occur in the video?\nA. The arrow appears, then the bars appear\nB. The bars appear, then the arrow appears\nC. They both appear at the same time", "gt-answer": "B. The bars appear, then the arrow appears", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the first event that occurs in the video?\nA. The bars appear\nB. The arrow appears\nC. The bars and the arrow appear at the same time", "gt-answer": "A. The bars appear", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the second event that occurs in the video?\nA. The bars appear\nB. The arrow appears\nC. The bars and the arrow appear at the same time", "gt-answer": "B. The arrow appears", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1056433484": { "direction": [ { "question": "What is the direction of the Earth's motion around the Sun?\nA. Counter-clockwise\nB. Clockwise\nC. Upwards", "gt-answer": "A. Counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction does the Earth travel in its orbit around the Sun?\nA. Clockwise\nB. Counter-clockwise\nC. Vertical", "gt-answer": "B. Counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "The Earth's rotation in relation to the Sun follows a ____________ direction.\nA. Counter-clockwise\nB. Clockwise\nC. Horizontal", "gt-answer": "A. Counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed of the earth's rotation compared to the sun?\nA. Faster than the sun\nB. Slower than the sun\nC. The same as the sun", "gt-answer": "A. Faster than the sun", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which statement accurately describes the earth's speed compared to the sun?\nA. The earth rotates slower than the sun\nB. The earth rotates faster than the sun\nC. They rotate at equal speeds", "gt-answer": "B. The earth rotates faster than the sun", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In terms of speed, how does the earth's rotation compare to the sun?\nA. The sun rotates slower than the earth\nB. The sun rotates faster than the earth\nC. The earth rotates faster than the sun", "gt-answer": "C. The earth rotates faster than the sun", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1073914229": { "direction": [ { "question": "What direction are the trains moving?\nA. in the same direction\nB. towards each other\nC. away from each other", "gt-answer": "B. towards each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what manner are the trains traveling?\nA. stopped\nB. in the same direction\nC. towards each other\nD. away from each other", "gt-answer": "C. towards each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the trajectory of the trains?\nA. perpendicular to each other\nB. moving away from each other\nC. proceeding in the same way\nD. moving towards each other", "gt-answer": "D. moving towards each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1099360359": { "speed": [ { "question": "Which train drives faster?\nA. The train closer to the screen\nB. There is no information about their speeds\nC. They both drive at the same speed\nD. The train further away from the screen", "gt-answer": "D. The train further away from the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the relative speed between the two trains?\nA. There is no information about their speeds\nB. They both drive at the same speed\nC. The train closer to the screen drives faster\nD. The train further away from the screen drives faster", "gt-answer": "D. The train further away from the screen drives faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "According to the video, which train has a higher speed?\nA. The train further away from the screen\nB. They both drive at the same speed\nC. There is no information about their speeds\nD. The train closer to the screen", "gt-answer": "A. The train further away from the screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1098970151": { "action": [ { "question": "What is the cat doing in the video?\nA. licking its paw\nB. washing its face\nC. waving its paw\nD. licking its belly", "gt-answer": "A. licking its paw", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which body part of the cat is it licking?\nA. nose\nB. ears\nC. paws\nD. tail", "gt-answer": "C. paws", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the cat doing with its paw?\nA. licking its paw\nB. waving its paw\nC. watching its paw\nD. biting its paw", "gt-answer": "A. licking its paw", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1081734740": { "attribute_change": [ { "question": "What is happening to the texture of the leaf?\nA. It is turning from green to yellow\nB. It is turning from white to green\nC. It is turning from green to white\nD. It is turning from yellow to green", "gt-answer": "A. It is turning from green to yellow", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What color is the leaf turning into?\nA. White\nB. Green\nC. Yellow", "gt-answer": "C. Yellow", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What change is occurring in the leaf?\nA. It is getting smaller\nB. It is becoming white\nC. It is becoming yellow\nD. It is becoming green", "gt-answer": "C. It is becoming yellow", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1093719871": { "attribute_change": [ { "question": "What is happening to the pink flowers?\nA. growing taller\nB. falling off petals\nC. turning from withered to full blossom\nD. turning from full blossom to withered", "gt-answer": "C. turning from withered to full blossom", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "How are the pink flowers transforming?\nA. from small buds to big flowers\nB. from full blossom to withered\nC. from half-open to closed\nD. from withered to full blossom", "gt-answer": "D. from withered to full blossom", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the final appearance of the pink flowers?\nA. small buds\nB. died petals\nC. fresh leaves\nD. fully bloomed", "gt-answer": "D. fully bloomed", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1042819039": { "speed": [ { "question": "What is the speed of the video?\nA. slow motion\nB. time-lapse\nC. normal speed", "gt-answer": "B. time-lapse", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the pace at which the video is playing?\nA. normal speed\nB. slow motion\nC. fast forward", "gt-answer": "C. fast forward", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In what manner is the video being shown?\nA. in real-time\nB. in time-lapse\nC. in slow motion", "gt-answer": "B. in time-lapse", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "In what order did the events occur?\nA. The street was filled with people, then it was filled with vehicles\nB. The street was filled with vehicles, then it was empty\nC. The street was filled with vehicles, then it was filled with people\nD. The street was filled with people, then it was empty", "gt-answer": "A. The street was filled with people, then it was filled with vehicles", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What happened first in the video?\nA. The street was filled with vehicles\nB. The street was filled with people\nC. Both events occurred simultaneously", "gt-answer": "B. The street was filled with people", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What happened second in the video?\nA. The street was filled with vehicles\nB. Both events occurred simultaneously\nC. The street was filled with people", "gt-answer": "A. The street was filled with vehicles", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1093139559": { "direction": [ { "question": "What is the type of camera motion in the video? \nA. Zooming into three football players\nB. Panning left\nC. Panning right\nD. Zooming out from three football palyers", "gt-answer": "A. Zooming into three football players", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the camera moving? \nA. Zooming in\nB. Upwards\nC. Zooming out\nD. Downwards", "gt-answer": "A. Zooming in", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which option best describes the camera's motion? \nA. Tilting upwards\nB. Zooming forward\nC. Zooming backward\nD. Standing still", "gt-answer": "B. Zooming forward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the light condition on the football players?\nA. staying the same\nB. turning darker\nC. turning brighter", "gt-answer": "C. turning brighter", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "How would you describe the change in light on the football players?\nA. dimming\nB. flickering\nC. intensifying", "gt-answer": "C. intensifying", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which statement accurately describes the change on the football players?\nA. becoming blurry\nB. becoming more visible\nC. becoming dimmer", "gt-answer": "B. becoming more visible", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055973887": { "attribute_change": [ { "question": "What is happening to the fire ball? \nA. staying the same size\nB. getting smaller\nC. getting larger", "gt-answer": "C. getting larger", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "How is the fire ball changing? \nA. splitting in half\nB. expanding out\nC. contracting into the center", "gt-answer": "B. expanding out", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In what way is the fire ball transforming? \nA. changing into a cube size\nB. shrinking in size\nC. growing in size", "gt-answer": "C. growing in size", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1098710341": { "action": [ { "question": "What is the person doing in the video?\nA. drinking water from a glass\nB. pouring water into a glass\nC. washing hands with water\nD. spilling water on the floor", "gt-answer": "B. pouring water into a glass", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action is the person performing?\nA. drinking water from a glass\nB. stirring water in a bowl\nC. pouring water into a glass\nD. adding water into a pot", "gt-answer": "C. pouring water into a glass", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is being performed by the person?\nA. washing hands with water\nB. spilling water on the floor\nC. drinking water from a glass\nD. pouring water into a glass", "gt-answer": "D. pouring water into a glass", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the glass?\nA. It is changing color\nB. It is going from full of water to empty\nC. It is going from empty to full of water\nD. It is transforming into a different shape", "gt-answer": "C. It is going from empty to full of water", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the final state of the glass?\nA. It is broken into pieces\nB. It is about 70% full with water\nC. It is half full with water\nD. It is empty", "gt-answer": "B. It is about 70% full with water", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In whay way is the glass changing?\nA. Water was disappearing from the glass\nB. The glass was heated\nC. Water was poured into the glass\nD. A chemical reaction occurred in the glass", "gt-answer": "C. Water was poured into the glass", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1062736174": { "action": [ { "question": "What is the chef doing in the video?\nA. chopping steak\nB. sprinkling vegetables on steak\nC. sprinkling salt on steak\nD. grilling steak", "gt-answer": "C. sprinkling salt on steak", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action is the chef performing on the steak?\nA. flipping the steak\nB. pouring water\nC. sprinkling salt\nD. seasoning with pepper", "gt-answer": "C. sprinkling salt", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the chef's activity related to the steak?\nA. marinating with spices\nB. sprinkling salt on it\nC. cutting into slices\nD. serving with salad", "gt-answer": "B. sprinkling salt on it", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1099116143": { "attribute_change": [ { "question": "What is happening to the pink liquid?\nA. White foam disappears from the surface\nB. White foam appears on the surface\nC. It is freezing\nD. It is evaporating", "gt-answer": "B. White foam appears on the surface", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be observed visually on the pink liquid?\nA. White foam appears on the surface\nB. The liquid is turning transparent\nC. White foam disappears from the surface", "gt-answer": "A. White foam appears on the surface", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the appearance of the pink liquid affected?\nA. White foam appears on the surface\nB. It becomes blue\nC. White foam disappears from the surface\nD. It becomes green", "gt-answer": "A. White foam appears on the surface", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1108398787": { "action": [ { "question": "What type of action is the person performing?\nA. Chatting on a smartphone device\nB. Operating system settings on a smartphone device\nC. Watching videos on a smartphone device\nD. Playing games on a smartphone device", "gt-answer": "B. Operating system settings on a smartphone device", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity is the person engaged in?\nA. Watching videos on a smartphone device\nB. Making a phone call using a smartphone device\nC. Operating system settings on a smartphone device\nD. Chatting on a smartphone device", "gt-answer": "C. Operating system settings on a smartphone device", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the person doing with the smartphone?\nA. Listening to music\nB. Watching a movie\nC. Texting a friend\nD. Operating system settings", "gt-answer": "D. Operating system settings", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of the events that the person is performing?\nA. Scrolling down and then entering passwords\nB. Entering passwords and then scrolling down\nC. Scrolling up and then entering passwords\nD. Entering passwords and then scrolling up", "gt-answer": "A. Scrolling down and then entering passwords", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which order are the events occurring for the person?\nA. Entering passwords and then scrolling down\nB. Entering passwords and then scrolling up\nC. Scrolling down and then entering passwords\nD. Scrolling up and then entering passwords", "gt-answer": "C. Scrolling down and then entering passwords", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the person performing the actions?\nA. Scrolling down and then entering passwords\nB. Scrolling up and then entering passwords\nC. Entering passwords and then scrolling down\nD. Entering passwords and then scrolling up", "gt-answer": "A. Scrolling down and then entering passwords", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1080591311": { "direction": [ { "question": "What direction is the jellyfish moving?\nA. moving towards the right\nB. floating upwards\nC. moving towards the left\nD. sinking downwards", "gt-answer": "B. floating upwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of motion for the jellyfish?\nA. floating to the right\nB. floating to the left\nC. floating downwards\nD. floating upwards", "gt-answer": "D. floating upwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the jellyfish moving?\nA. going down\nB. going away from the screen\nC. going towards the screen\nD. going up", "gt-answer": "D. going up", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1107034223": { "action": [ { "question": "What is the bear doing in the river?\nA. swimming\nB. climbing trees\nC. sleeping\nD. catching fishes", "gt-answer": "D. catching fishes", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which activity is the bear engaged in?\nA. hibernating\nB. eating\nC. fishing\nD. running", "gt-answer": "C. fishing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the main action of the bear?\nA. climbing rocks\nB. drinking water\nC. catching fishes\nD. roaring", "gt-answer": "C. catching fishes", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events involving the bear?\nA. Turning back and then catching a fish\nB. Running forward and then catching a fish\nC. Catching a fish and then swallow it\nD. Catching a fish and then turning back", "gt-answer": "D. Catching a fish and then turning back", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What was the sequential arrangement of events for the bear?\nA. Catching a fish and then climbing up a tree\nB. Turning back and then catching a fish\nC. Catching a fish and then turning back\nD. Jumping into the water and then catching a fish", "gt-answer": "C. Catching a fish and then turning back", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first about the bear?\nA. Catching a fish\nB. Jumping out of water\nC. Falling over\nD. Turning back", "gt-answer": "A. Catching a fish", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1025623079": { "attribute_change": [ { "question": "What is happening to the skyscraper?\nA. lighting up\nB. growing taller\nC. in construction\nD. collapsing", "gt-answer": "D. collapsing", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the condition of the skyscraper?\nA. in construction\nB. collapsing\nC. being eracted\nD. burning in fire", "gt-answer": "B. collapsing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What change is occurring with the skyscraper?\nA. burning in fire\nB. collapsing\nC. standing up\nD. turning darker", "gt-answer": "B. collapsing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1094782389": { "action": [ { "question": "What action is the dog performing in the video?\nA. Running towards a woman\nB. Jumping towards a woman\nC. Barking to a woman\nD. Giving a high five to a woman", "gt-answer": "D. Giving a high five to a woman", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity is the dog engaged in?\nA. Catching food from a woman\nB. Giving a high five to a woman\nC. Wagging its tail at a woman\nD. Licking a woman", "gt-answer": "B. Giving a high five to a woman", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action did the dog execute?\nA. Licking the woman\nB. Fetching a ball thrown by the woman\nC. Digging a hole\nD. Giving a high five to the woman", "gt-answer": "D. Giving a high five to the woman", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3411228673": { "direction": [ { "question": "What is the direction of the movement in the video?\nA. sideways along the skyscraper buildings\nB. upwards among skyscraper buildings\nC. downwards towards the ground", "gt-answer": "B. upwards among skyscraper buildings", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the camera moving?\nA. backwards\nB. forwards\nC. downwards\nD. upwards", "gt-answer": "D. upwards", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the path of movement in the video?\nA. flying downwards\nB. flying forwards\nC. flying backwards\nD. flying upwards", "gt-answer": "D. flying upwards", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1043487715": { "action": [ { "question": "What are the children doing in the video?\nA. diving into water\nB. eating\nC. sleeping", "gt-answer": "A. diving into water", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which activity can be seen in the video involving the children?\nA. hiking\nB. dancing\nC. diving into water", "gt-answer": "C. diving into water", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the primary action performed by the children?\nA. rowing a boat\nB. diving into water\nC. cooking", "gt-answer": "B. diving into water", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events in the video involving the children?\nA. diving into water and then making gestures to the camera\nB. making gestures to the camera and then diving into water", "gt-answer": "A. diving into water and then making gestures to the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What are the children doing first in the video?\nA. leaving the swimming pool\nB. diving into water\nC. making gestures to the camera", "gt-answer": "B. diving into water", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which event happens secondly in the video featuring the children?\nA. diving into water\nB. swimming around\nC. making gestures to the camera", "gt-answer": "C. making gestures to the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1093737353": { "direction": [ { "question": "What type of motion is the camera performing in the video?\nA. panning to the right\nB. panning to the left\nC. tilting up\nD. zooming in", "gt-answer": "A. panning to the right", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the camera moving?\nA. downwards\nB. rightwards\nC. leftwards\nD. upwards", "gt-answer": "B. rightwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of the camera's movement?\nA. panning to the left\nB. panning to the right\nC. backwards\nD. forwards", "gt-answer": "B. panning to the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the order that the equipments are shown in the video?\nA. A microscope and then a beaker\nB. A beaker and then a line of test tubes\nC. A beaker and then a microscope\nD. A line of test tubes and then a beaker", "gt-answer": "D. A line of test tubes and then a beaker", "video-llm-prediction": "A. A microscope and then a beaker", "match_success": true, "rating": 0 }, { "question": "What is shown in the video first?\nA. A beaker\nB. A microscope\nC. A line of test tubes", "gt-answer": "C. A line of test tubes", "video-llm-prediction": "A. A beaker", "match_success": true, "rating": 0 }, { "question": "What is shown in the video later?\nA. A beaker\nB. A microscope\nC. A line of test tubes", "gt-answer": "A. A beaker", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1063373449": { "attribute_change": [ { "question": "What is happening to the coronavirus?\nA. replicating itself\nB. mutating into a new strain\nC. assembling together\nD. dissolving under the attack of antibodies", "gt-answer": "D. dissolving under the attack of antibodies", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the coronavirus responding to antibodies?\nA. replicating itself\nB. dissolving under their attack\nC. avoiding them by hiding in cells\nD. assembling together", "gt-answer": "B. dissolving under their attack", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What occurs to the coronavirus?\nA. it assembles together\nB. it grows larger\nC. it dissolves\nD. it replicates", "gt-answer": "C. it dissolves", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1017768724": { "direction": [ { "question": "What is the direction of the person's movement?\nA. moving upwards\nB. moving leftwards\nC. moving downwards\nD. moving rightwards", "gt-answer": "D. moving rightwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the person heading?\nA. vertically\nB. backward\nC. forward\nD. horizontally", "gt-answer": "D. horizontally", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "How is the person moving?\nA. moving rightwards\nB. jumping upwards\nC. moving leftwards\nD. running forwards", "gt-answer": "A. moving rightwards", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1106280325": { "action": [ { "question": "What is the woman doing?\nA. hiking\nB. playing guitar\nC. reading book\nD. dancing", "gt-answer": "C. reading book", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in?\nA. painting a picture\nB. playing guitar\nC. sleeping\nD. reading book", "gt-answer": "D. reading book", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What can be seen in the video?\nA. woman reading book on the grass\nB. woman sleeping on the grass\nC. woman hiking in the wild\nD. woman drinking water ", "gt-answer": "A. woman reading book on the grass", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events in the video?\nA. A girl is shown reading a book and a body of water is shown simultaneously\nB. A girl is shown reading a book, then a body of water is shown\nC. A body of water is shown, then a girl is shown reading a book", "gt-answer": "B. A girl is shown reading a book, then a body of water is shown", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What happens first in the video?\nA. Both events happen at the same time\nB. A body of water is shown\nC. A girl is shown reading a book", "gt-answer": "C. A girl is shown reading a book", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which event appears second in the video?\nA. A girl is shown reading a book\nB. Both events appear at the same time\nC. A body of water is shown", "gt-answer": "C. A body of water is shown", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100117263": { "direction": [ { "question": "What is the direction of the little lion's motion?\nA. downward\nB. upward\nC. towards the camera\nD. rightward", "gt-answer": "A. downward", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the little lion doing?\nA. sitting nearby an adult lion\nB. sitting on the back of an adult lion\nC. falling from the back of an adult lion\nD. jumping onto the back of an adult lion", "gt-answer": "C. falling from the back of an adult lion", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction is the little lion going?\nA. falling down\nB. climbing up\nC. walking forward\nD. walking backward", "gt-answer": "A. falling down", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "15695290": { "action": [ { "question": "What is the person doing?\nA. playing soccer\nB. reading a book\nC. drawing a picture", "gt-answer": "C. drawing a picture", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the person engaged in?\nA. drawing a picture\nB. dancing\nC. cooking", "gt-answer": "A. drawing a picture", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the main task of the person?\nA. typing on the computer\nB. painting a wall\nC. drawing a picture", "gt-answer": "C. drawing a picture", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events in the video?\nA. A house is drawn, then a family of people is drawn\nB. A family of people is drawn, then a house is drawn\nC. The house and the family are drawn simultaneously", "gt-answer": "A. A house is drawn, then a family of people is drawn", "video-llm-prediction": "A. A house is drawn, then a family of people is drawn", "match_success": true, "rating": 1 }, { "question": "Which event occurs before the other in the video?\nA. Both events occur simultaneously\nB. The family of people being drawn occurs before the house being drawn\nC. The house being drawn occurs before the family of people being drawn", "gt-answer": "C. The house being drawn occurs before the family of people being drawn", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the chronological order of the events in the video?\nA. The house is drawn first, then the family of people is drawn\nB. The family of people is drawn first, then the house is drawn\nC. Both events happen at the same time", "gt-answer": "A. The house is drawn first, then the family of people is drawn", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1091090295": { "order": [ { "question": "In what order do the events occur in the video?\nA. A bird flying onto the back of a hippo, then a hippo pokes its head out of water\nB. The events happen simultaneously\nC. A hippo pokes its head out of water, then a bird flying onto the back of a hippo", "gt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What event happens first in the video?\nA. A bird flying onto the back of a hippo\nB. A bird flying away from the back of a hippo\nC. A hippo pokes its head out of water\nD. A hippo puts its head into water", "gt-answer": "A. A bird flying onto the back of a hippo", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What event happens second in the video?\nA. A hippo puts its head into water\nB. A bird flying away from the back of a hippo\nC. A bird flying onto the back of a hippo\nD. A hippo pokes its head out of water", "gt-answer": "D. A hippo pokes its head out of water", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1021488277": { "direction": [ { "question": "What is happening in the video? \nA. A person drops down the pineapple\nB. A person pushes forward the pineapple\nC. A person rotates the pineapple\nD. A person picks up the pineapple", "gt-answer": "D. A person picks up the pineapple", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What action is taking place in the video?\nA. The pineapple is being dropped by a person.\nB. The pineapple is being rotated by a person.\nC. The pineapple is being pushed forward by a person.\nD. The pineapple is being picked up by a person.", "gt-answer": "D. The pineapple is being picked up by a person.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be observed in the video?\nA. The pineapple is rotated by a person.\nB. The pineapple is pushed in a forward direction.\nC. The pineapple is lifted by an individual.\nD. The pineapple is released and falls downward.", "gt-answer": "C. The pineapple is lifted by an individual.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1106899445": { "action": [ { "question": "What action is the person performing with the toothbrush?\nA. brushing teeth\nB. removing toothpaste from the toothbrush\nC. squeezing out toothpaste on the toothbrush", "gt-answer": "C. squeezing out toothpaste on the toothbrush", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the main action of the person in the video?\nA. removing toothpaste from the toothbrush\nB. brushing teeth\nC. squeezing out toothpaste on a toothbrush", "gt-answer": "C. squeezing out toothpaste on a toothbrush", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What happens in the video?\nA. a person is brushing teeth using the toothbrush\nB. toothpaste being washed from a toothbrush\nC. toothpaste being squeezed on a toothbrush", "gt-answer": "C. toothpaste being squeezed on a toothbrush", "video-llm-prediction": "A. a person is brushing teeth using the toothbrush", "match_success": true, "rating": 0 } ] }, "1067925569": { "order": [ { "question": "What is the order of events in the video?\nA. First, a container ship is shown, then a cargo train is shown\nB. First, a cargo train is shown, then a container ship is shown\nC. The cargo train and the container ship are shown simultaneously", "gt-answer": "A. First, a container ship is shown, then a cargo train is shown", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what sequence are the events presented in the video?\nA. Firstly, a container ship is shown, secondly a cargo train is shown\nB. Firstly, a cargo train is shown, secondly a container ship is shown\nC. The cargo train and the container ship are shown at the same time", "gt-answer": "A. Firstly, a container ship is shown, secondly a cargo train is shown", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event comes after the other in the video?\nA. A cargo train is shown after a container truck is shown\nB. A container ship is shown after a cargo train is shown\nC. A cargo train is shown after a container ship is shown\nD. A container truck is shown before a cargo train is shown", "gt-answer": "C. A cargo train is shown after a container ship is shown", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1062609286": { "attribute_change": [ { "question": "What is happening to the battery charge?\nA. decreasing\nB. staying constant\nC. increasing", "gt-answer": "C. increasing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the battery charge changing?\nA. increasing\nB. random\nC. decreasing", "gt-answer": "A. increasing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which option describes the change of the battery charge?\nA. decreasing\nB. increasing\nC. staying the same", "gt-answer": "B. increasing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100397435": { "action": [ { "question": "What is the person doing in the video?\nA. turning off the robot vacuum cleaner\nB. starts the robot vacuum cleaner\nC. fixing the robot vacuum cleaner", "gt-answer": "B. starts the robot vacuum cleaner", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What action does the person perform?\nA. sweeping the floor\nB. starts the robot vacuum cleaner\nC. turning off the robot vacuum cleaner", "gt-answer": "B. starts the robot vacuum cleaner", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity does the person engage in?\nA. taking apart the robot vacuum cleaner\nB. recharging the robot vacuum cleaner\nC. starts the robot vacuum cleaner", "gt-answer": "C. starts the robot vacuum cleaner", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "What direction is the robot vacuum cleaner moving in the video?\nA. to the right side of the screen\nB. to the left side of the screen\nC. towards the screen\nD. away from the screen", "gt-answer": "A. to the right side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the movement pattern of the robot vacuum cleaner?\nA. straight line towards the screen\nB. straight line to the right side of the screen\nC. straight line to the left side of the screen\nD. straight line away from the screen", "gt-answer": "B. straight line to the right side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Where is the robot vacuum cleaner heading?\nA. to the lower side of the screen\nB. to the upper side of the screen\nC. to the left side of the screen\nD. to the right side of the screen", "gt-answer": "D. to the right side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "order": [ { "question": "What is the order of events in the video?\nA. A person enters the screen and then the robot vacuum cleaner starts moving\nB. The robot vacuum cleaner starts moving and then a person enters the screen", "gt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What happens first in the video?\nA. A person enters the screen\nB. The robot vacuum cleaner starts moving", "gt-answer": "A. A person enters the screen", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What happens second in the video?\nA. A person enters the screen\nB. The robot vacuum cleaner starts moving", "gt-answer": "B. The robot vacuum cleaner starts moving", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1108534143": { "direction": [ { "question": "What is the puppy doing in the video?\nA. staying in a wigwam\nB. walking into a wigwam\nC. walking out of a wigwam", "gt-answer": "C. walking out of a wigwam", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the puppy moving?\nA. walking out of a wigwam\nB. entring a wigwam\nC. walking around a wigwam", "gt-answer": "A. walking out of a wigwam", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is the puppy taking?\nA. entring a wigwam\nB. walking out of a wigwam\nC. walking around a wigwam", "gt-answer": "B. walking out of a wigwam", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1034049020": { "action": [ { "question": "What is the woman doing in the video?\nA. cleaning a wall while walking\nB. standing still and painting a wall\nC. painting a wall while walking", "gt-answer": "C. painting a wall while walking", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is taking place in the video?\nA. a girl standing and cleaning a wall\nB. a girl is walking and cleaning a wall\nC. a girl painting a wall while walking", "gt-answer": "C. a girl painting a wall while walking", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following actions is the woman performing?\nA. standing still and painting a wall\nB. standing and cleaning a wall\nC. painting a wall while walking", "gt-answer": "C. painting a wall while walking", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events?\nA. Turning back and painting the wall, then walking\nB. Turning back, then painting a wall while walking\nC. Painting a wall while walking, then turning back", "gt-answer": "C. Painting a wall while walking, then turning back", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which order are the events occurring?\nA. Turning back first and later painting a wall while walking\nB. Painting a wall while walking, then turning back\nC. Turning back and painting the wall, then walking", "gt-answer": "B. Painting a wall while walking, then turning back", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What happens later to the woman?\nA. painting a wall\nB. sitting down\nC. turning back", "gt-answer": "C. turning back", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1047368344": { "direction": [ { "question": "What is the girl doing?\nA. jumping into water\nB. jumping around water\nC. swimming in the water\nD. jumping out of water", "gt-answer": "A. jumping into water", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the girl moving?\nA. towards the camera\nB. towards the water\nC. away from the water", "gt-answer": "B. towards the water", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the girl moving?\nA. towards the water\nB. away from the water\nC. inside the water", "gt-answer": "A. towards the water", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events for the girl?\nA. putting on clothes and then jumping into water\nB. taking off clothes and then jumping into water\nC. jumping into water and then putting on clothes\nD. jumping into water and then taking off clothes", "gt-answer": "B. taking off clothes and then jumping into water", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event comes first for the girl?\nA. taking off clothes\nB. jumping into water\nC. putting on clothes", "gt-answer": "A. taking off clothes", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the sequence of actions performed by the girl?\nA. putting on clothes, jumping into water, taking off clothes\nB. jumping into water, putting on clothes, taking off clothes\nC. taking off clothes, putting on clothes, jumping into water", "gt-answer": "C. taking off clothes, putting on clothes, jumping into water", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1060403198": { "attribute_change": [ { "question": "What is happening to the tree?\nA. increasing height\nB. decreasing height\nC. shedding leaves\nD. changing color", "gt-answer": "A. increasing height", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which attribute of the tree is undergoing a transformation?\nA. position\nB. height\nC. color", "gt-answer": "B. height", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What term can be used to describe the change happening to the tree?\nA. wilting\nB. growing in size\nC. falling down\nD. reducing in size", "gt-answer": "B. growing in size", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1100074677": { "order": [ { "question": "What is the order of the events performed by the person?\nA. throwing the paper note away and then tearing it apart\nB. tearing apart the paper note and then throwing it away\nC. standing the paper note up and then writing something on the paper note\nD. writing something on the paper note and then standing the paper note up", "gt-answer": "D. writing something on the paper note and then standing the paper note up", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence did the person perform the actions?\nA. writing something on the paper note and then tearing it apart\nB. standing the paper note up and then writing something on the paper note\nC. throwing the paper note away and then standing the paper note up\nD. throwing the paper note away and then tearing it apart", "gt-answer": "B. standing the paper note up and then writing something on the paper note", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How did the person arrange the actions in order?\nA. standing the paper note up and then writing something on it\nB. tearing apart the paper note and then standing it up\nC. throwing away the paper note and then tearing it apart\nD. writing something on the paper note and then throwing it away", "gt-answer": "A. standing the paper note up and then writing something on it", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1100350201": { "order": [ { "question": "What is the order of events in the video?\nA. The man is drawn and then the little girl is drawn\nB. The man is drawn first, then the little girl disappears and is drawn\nC. The little girl is drawn and then the man is drawn\nD. The little girl is drawn first, then the man gets erased and drawn", "gt-answer": "C. The little girl is drawn and then the man is drawn", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video?\nA. The man is drawn and then the little girl disappears\nB. The little girl is drawn first, then the man disappears\nC. The little girl is drawn and then the man is drawn\nD. The man is drawn first, then the little girl appears", "gt-answer": "C. The little girl is drawn and then the man is drawn", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs first in the video?\nA. The man is drawn\nB. The man is erased\nC. The little girl is erased\nD. The little girl is drawn", "gt-answer": "D. The little girl is drawn", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1099109715": { "attribute_change": [ { "question": "What is happening to the number of fruits and vegetables?\nA. becoming rotten\nB. increasing\nC. decreasing\nD. staying the same", "gt-answer": "B. increasing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the change to the fruits and vegetables?\nA. disappearing\nB. increasing number\nC. staying the same\nD. decaying", "gt-answer": "B. increasing number", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which is the most accurate statement about the number of fruits and vegetables?\nA. It is getting bigger.\nB. It is getting smaller.\nC. It is changing sporadically.\nD. It is remaining constant.", "gt-answer": "A. It is getting bigger.", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1051211272": { "attribute_change": [ { "question": "What is happening to the toast with cream cheese?\nA. gradually reappearing piece by piece\nB. staying the same size\nC. gradually being eaten out and disappearing", "gt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What alteration is taking place with the cream cheese-covered toast?\nA. Gradually emerging piece by piece\nB. Remaining constant in size\nC. Slowly diminishing as it is consumed", "gt-answer": "C. Slowly diminishing as it is consumed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the outcome of the toast with cream cheese?\nA. it gradually reappears piece by piece\nB. it gradually disappears piece by piece\nC. it gradually spoils", "gt-answer": "B. it gradually disappears piece by piece", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059815936": { "attribute_change": [ { "question": "What is happening to the paper?\nA. changing from a wrinkled paper ball into a flattened sheet\nB. changing from a flattened sheet into scraps of paper\nC. changing from a flattened sheet into a wrinkled paper ball", "gt-answer": "A. changing from a wrinkled paper ball into a flattened sheet", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the paper transform?\nA. crumpling into a ball\nB. tearing apart\nC. unfolding", "gt-answer": "C. unfolding", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the main change occurring in the paper?\nA. changing teared apart\nB. being folded\nC. being flattened out", "gt-answer": "C. being flattened out", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086423566": { "order": [ { "question": "What is the order of events in the video?\nA. The bowl rotates and then food is added into the bowl\nB. Food is added into the bowl and then the bowl rotates\nC. The bowl flips upside down and then food is added into the bowl\nD. Food is added into the bowl and then the bowl flips upside down", "gt-answer": "B. Food is added into the bowl and then the bowl rotates", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video?\nA. Food is added into the bowl and then the bowl rotates\nB. The bowl rotates and then food is added into the bowl\nC. Food is added into the bowl and then it disappears\nD. The bowl spins around and food flies out of the bowl", "gt-answer": "A. Food is added into the bowl and then the bowl rotates", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the correct order of actions in the video?\nA. Food is thrown into the air and then falls into the bowl\nB. The bowl rotates and then food is added into the bowl\nC. Food is piled up inside the bowl and then the bowl rotates\nD. The bowl splits into two halves and then food is added into one half", "gt-answer": "C. Food is piled up inside the bowl and then the bowl rotates", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1069611487": { "order": [ { "question": "In which order do the events occur in the video?\nA. Pizza slices disappear, then a paper box appears\nB. Pizza slices appear, then a paper box appears\nC. A paper box appears, then pizza slices disappear", "gt-answer": "C. A paper box appears, then pizza slices disappear", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What happened first in the video?\nA. Pizza slices disappear\nB. A paper box appears\nC. A paper box disappears", "gt-answer": "B. A paper box appears", "video-llm-prediction": "A. Pizza slices disappear", "match_success": true, "rating": 0 }, { "question": "What happened last in the video?\nA. Pizza slices being placed on the paper box\nB. Pizza slices being taken away\nC. A paper box appears", "gt-answer": "B. Pizza slices being taken away", "video-llm-prediction": "A. Pizza slices being placed on the paper box", "match_success": true, "rating": 0 } ] }, "1100329207_reverse": { "direction": [ { "question": "What is the direction of the camera view?\nA. moving right\nB. moving backward\nC. moving left\nD. moving forward", "gt-answer": "B. moving backward", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "In which direction is the video panning?\nA. up\nB. down\nC. backward\nD. forward", "gt-answer": "C. backward", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the direction of the camera movement?\nA. moving forward\nB. tilting up\nC. tilting down\nD. moving backward", "gt-answer": "D. moving backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1089201973_reverse": { "direction": [ { "question": "What is the direction of the football in the video?\nA. moving from left to right\nB. moving from right to left\nC. stationary", "gt-answer": "B. moving from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the football traveling?\nA. Rightwards\nB. Upwards\nC. Leftwards\nD. Downwards", "gt-answer": "C. Leftwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the path of the football?\nA. from bottom to top\nB. from right to left\nC. from left to right\nD. from top to bottom", "gt-answer": "B. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1034736653_reverse": { "direction": [ { "question": "In which direction are the woman athletes running?\nA. from right to left\nB. in circles\nC. from left to right", "gt-answer": "A. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "From which side are the woman athletes entering the screen?\nA. right\nB. top\nC. left\nD. bottom", "gt-answer": "A. right", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which way are the woman athletes heading?\nA. from left to right\nB. away from the camera\nC. from right to left\nD. towards the camera", "gt-answer": "C. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1084153195_reverse": { "direction": [ { "question": "What is the movement of the dolphins?\nA. swimming towards the shore\nB. hovering in one place\nC. swimming away from the shore", "gt-answer": "C. swimming away from the shore", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction are the dolphins swimming?\nA. parallel to the shore\nB. towards the shore\nC. away from the shore", "gt-answer": "C. away from the shore", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "If you observe the dolphins, what direction would you notice them heading?\nA. towards the shore\nB. parallel to the shore\nC. away from the shore", "gt-answer": "C. away from the shore", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1081092839_reverse": { "direction": [ { "question": "What is the direction of the sun?\nA. descending\nB. ascending\nC. moving sideways", "gt-answer": "B. ascending", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement pattern of the sun?\nA. falling\nB. rising\nC. remaining still", "gt-answer": "B. rising", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the movement direction of the sun?\nA. descending\nB. ascending\nC. rotating", "gt-answer": "B. ascending", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction does the sun travel during sunset?\nA. downwards\nB. upwards\nC. horizontally", "gt-answer": "B. upwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059462749_reverse": { "direction": [ { "question": "In which direction is the person moving?\nA. rightwards\nB. downwards\nC. upwards\nD. leftwards", "gt-answer": "C. upwards", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What word describes the movement of the person?\nA. standing\nB. descending\nC. climbing up\nD. jumping", "gt-answer": "C. climbing up", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "From a higher point to a lower point, the person is:\nA. rotating\nB. rising\nC. staying still\nD. descending", "gt-answer": "B. rising", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1088279109_reverse": { "direction": [ { "question": "What is the elevator doing?\nA. rising\nB. going down\nC. staying still", "gt-answer": "B. going down", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the elevator moving?\nA. up\nB. down\nC. not moving", "gt-answer": "B. down", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of the elevator's movement?\nA. descending\nB. ascending\nC. stationary", "gt-answer": "A. descending", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which way is the elevator going?\nA. up\nB. down\nC. stopped", "gt-answer": "B. down", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1096612823_reverse": { "direction": [ { "question": "What is happening to the video?\nA. zooming out\nB. rotating\nC. panning left\nD. zooming in", "gt-answer": "A. zooming out", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the direction of the video?\nA. panning right\nB. fading out\nC. zooming in\nD. moving backward", "gt-answer": "D. moving backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the video changing?\nA. panning upwards\nB. rewinding\nC. zooming out\nD. zooming in", "gt-answer": "C. zooming out", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1075484900_reverse": { "direction": [ { "question": "Which way is the child facing in relation to the man?\nA. Forward\nB. Turning towards the man\nC. Turning away from the man\nD. Backward", "gt-answer": "B. Turning towards the man", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction is the child moving in relation to the man?\nA. Backward\nB. Forward\nC. Turning away from the man\nD. Turning towards the man", "gt-answer": "D. Turning towards the man", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the orientation of the child with respect to the man?\nA. Downwards\nB. Upwards\nC. Turning away from the man\nD. Turning towards the man", "gt-answer": "D. Turning towards the man", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1090578917_reverse": { "direction": [ { "question": "What direction is the man leaping?\nA. to his left\nB. backward\nC. forward\nD. to his right", "gt-answer": "A. to his left", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which way is the man moving?\nA. left\nB. forwards\nC. right\nD. up", "gt-answer": "A. left", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the direction of the man's movement?\nA. counterclockwise\nB. horizontal\nC. vertically\nD. clockwise", "gt-answer": "B. horizontal", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1075338140_reverse": { "direction": [ { "question": "What is the direction of the ball?\nA. forward and backward\nB. spinning in place\nC. rolling from left to right\nD. rolling from right to left", "gt-answer": "D. rolling from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the ball moving?\nA. counterclockwise\nB. rolling from left to right\nC. clockwise\nD. rolling from right to left", "gt-answer": "D. rolling from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction does the ball travel?\nA. straight ahead\nB. rolling from left to right\nC. rolling from right to left\nD. floating in mid-air", "gt-answer": "C. rolling from right to left", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1067268403_reverse": { "direction": [ { "question": "What is the movement direction of the wind turbines?\nA. Stationary\nB. Rotating clockwise\nC. Rotating counterclockwise", "gt-answer": "C. Rotating counterclockwise", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which way are the wind turbines rotating?\nA. Randomly\nB. Clockwise\nC. Anti-clockwise", "gt-answer": "C. Anti-clockwise", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In which direction are the wind turbines turning?\nA. Anticlockwise\nB. Still\nC. Clockwise", "gt-answer": "A. Anticlockwise", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the rotational direction of the wind turbines?\nA. Clockwise\nB. Anti-clockwise\nC. Unchanging", "gt-answer": "B. Anti-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1096007487_reverse": { "direction": [ { "question": "From the camera's point of view, in which direction is the 3d cloud moving?\nA. upward\nB. downward\nC. leftward\nD. rightward", "gt-answer": "D. rightward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the 3d cloud moving from the camera's point of view?\nA. contracting\nB. spinning leftward\nC. spinning rightward\nD. expanding", "gt-answer": "C. spinning rightward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement pattern of the 3d cloud as seen from the camera's point of view?\nA. from right to left\nB. rotating clockwise\nC. rotating counter-clockwise\nD. from left to right", "gt-answer": "D. from left to right", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1095939659_reverse": { "direction": [ { "question": "In which direction is the light growing?\nA. Downwards\nB. Clockwise\nC. Counterclockwise\nD. Upwards", "gt-answer": "C. Counterclockwise", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the direction of the light's movement?\nA. Clockwise\nB. Anticlockwise\nC. Straight forward\nD. Downwards", "gt-answer": "B. Anticlockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the light changing direction?\nA. Spinning vertically\nB. Rotating clockwise\nC. Shifting diagonally\nD. Disappearing counterclockwise", "gt-answer": "D. Disappearing counterclockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1098785169_reverse": { "direction": [ { "question": "What is the direction of the galaxy's spin?\nA. counterclockwise\nB. left to right\nC. clockwise\nD. up and down", "gt-answer": "A. counterclockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the galaxy rotating?\nA. backward\nB. counter clockwise\nC. clockwise\nD. forward", "gt-answer": "B. counter clockwise", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How is the galaxy spinning?\nA. backward\nB. counter clockwise\nC. clockwise\nD. forward", "gt-answer": "B. counter clockwise", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1099984801_reverse": { "direction": [ { "question": "What is the movement of the clouds?\nA. moving away from the camera\nB. staying still\nC. moving towards the camera", "gt-answer": "A. moving away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction are the clouds heading?\nA. towards the camera\nB. upward\nC. downward\nD. away from the camera", "gt-answer": "D. away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement direction of the clouds?\nA. forward\nB. in a circular motion\nC. side to side\nD. backward", "gt-answer": "A. forward", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "What is happening to the entire video?\nA. staying the same\nB. getting darker\nC. getting brighter", "gt-answer": "C. getting brighter", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What change is occurring to the light condition of the video?\nA. getting darker\nB. remaining stable\nC. getting brighter", "gt-answer": "C. getting brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following best describes the change in the entire video?\nA. getting darker\nB. getting blurry\nC. turning brighter", "gt-answer": "C. turning brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1082419672_reverse": { "direction": [ { "question": "What is the direction of movement in the video?\nA. hovering\nB. flying forwards\nC. flying backwards", "gt-answer": "B. flying forwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the trajectory of the movement?\nA. straight line\nB. arc-shaped\nC. zigzag", "gt-answer": "A. straight line", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In what direction is the entire video moving relative to the ship?\nA. forward\nB. up\nC. down\nD. backward", "gt-answer": "A. forward", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1058985719_reverse": { "direction": [ { "question": "What is the direction in which the airplane is flying?\nA. bottom to top\nB. right to left\nC. top to bottom\nD. left to right", "gt-answer": "C. top to bottom", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the airplane moving on the screen?\nA. anticlockwise\nB. upwards\nC. clockwise\nD. downwards", "gt-answer": "D. downwards", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the trajectory of the airplane?\nA. vertically upwards\nB. vertically downwards\nC. horizontally rightwards\nD. horizontally leftwards", "gt-answer": "B. vertically downwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055413730_reverse": { "direction": [ { "question": "In which direction is the planet Earth spinning?\nA. Rightwards\nB. Downwards\nC. Leftwards\nD. Upwards", "gt-answer": "C. Leftwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Considering the camera's perspective, what is the rotational movement of the planet Earth?\nA. spinning to the left\nB. rotating upward\nC. spinning to the right", "gt-answer": "A. spinning to the left", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the apparent motion of the Earth based on the camera's viewpoint?\nA. away from the camera\nB. towards the camera\nC. spinning to the right\nD. spinning to the left", "gt-answer": "D. spinning to the left", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1081684532_reverse": { "direction": [ { "question": "What is the direction of the asteroids in the video?\nA. flying away from the camera\nB. flying to the left\nC. flying towards the camera\nD. flying to the right", "gt-answer": "A. flying away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which direction are the asteroids moving?\nA. downwards\nB. towards the camera\nC. upwards\nD. away from the camera", "gt-answer": "D. away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way are the asteroids going?\nA. towards the camera\nB. parallel to the camera\nC. away from the camera", "gt-answer": "C. away from the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "23391142_reverse": { "direction": [ { "question": "What direction is the video panning?\nA. Upwards\nB. Downwards\nC. To the left\nD. To the right", "gt-answer": "C. To the left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement of the video?\nA. Zoom in\nB. Panning to the left\nC. Zoom out\nD. Panning to the right", "gt-answer": "B. Panning to the left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the scene shifting?\nA. Panning to the left\nB. Panning to the right\nC. Away from the camera\nD. Towards the camera", "gt-answer": "A. Panning to the left", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1053758117_reverse": { "direction": [ { "question": "What is happening in the video?\nA. Zoom out from a 3D digital brain\nB. Standing still before a 3D digital brain\nC. Zoom into a 3D digital brain", "gt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the camera moving in the video?\nA. zooming in\nB. downwards\nC. upwards\nD. zooming out", "gt-answer": "D. zooming out", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the trajectory of the video's direction?\nA. panning right\nB. panning left\nC. zooming out\nD. zooming in", "gt-answer": "C. zooming out", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1106668103_reverse": { "direction": [ { "question": "What is the direction of movement in the video?\nA. staying still\nB. moving forward\nC. moving backward", "gt-answer": "C. moving backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what way is the primary motion depicted in the video?\nA. turning leftward\nB. moving forward\nC. moving backward\nD. turning rightward", "gt-answer": "C. moving backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the primary trajectory in the video?\nA. descending\nB. moving backward\nC. moving forward", "gt-answer": "B. moving backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1057163434_reverse": { "direction": [ { "question": "What is the chef doing with the bread?\nA. removing it from the top of the burger\nB. putting it on top of the burger\nC. putting it inside the burger\nD. throwing it away", "gt-answer": "A. removing it from the top of the burger", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which direction is the chef moving the bread?\nA. throwing it away\nB. removing it from the burger\nC. putting it on top of the burger\nD. putting it inside the burger", "gt-answer": "B. removing it from the burger", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which action is the chef performing with the bread?\nA. putting it on top of the burger\nB. picking it up from the burger\nC. inserting it inside the burger", "gt-answer": "B. picking it up from the burger", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100319395_reverse": { "direction": [ { "question": "What direction is the circular pattern moving?\nA. clockwise\nB. moving towards the camera\nC. counter-clockwise\nD. moving away from the camera", "gt-answer": "C. counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the circular pattern moving?\nA. spinning clockwise\nB. spinning counter-clockwise\nC. vibrating back and forth", "gt-answer": "B. spinning counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the circular pattern spinning?\nA. towards the screen\nB. anticlockwise\nC. clockwise\n D. away from the screen", "gt-answer": "B. anticlockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1101200293_reverse": { "direction": [ { "question": "What is the direction of the camera motion relative to the aircraft carrier?\nA. counterclockwise\nB. downward\nC. upward\nD. clockwise", "gt-answer": "A. counterclockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which way is the camera moving around the aircraft carrier?\nA. clockwise\nB. back and forth\nC. tilting upwards\nD. counterclockwise", "gt-answer": "D. counterclockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what direction is the camera flying around the aircraft carrier?\nA. clockwise\nB. descending\nC. ascending\nD. anti-clockwise", "gt-answer": "D. anti-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1072453637_reverse": { "direction": [ { "question": "What is the direction of the camera panning in the video?\nA. panning to the back of a fighter jet\nB. panning downwards around a fighter jet\nC. panning upwards around a fighter jet\nD. panning to the front of a fighter jet", "gt-answer": "D. panning to the front of a fighter jet", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the camera's panning orientation in the video?\nA. Moving to the front of a fighter jet\nB. Ascending around a fighter jet\nC. Moving to the rear of a fighter jet\nD. Descending around a fighter jet", "gt-answer": "A. Moving to the front of a fighter jet", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Identify the camera's panning movement in the video.\nA. Panning to the back of a fighter jet\nB. Panning upward around a fighter jet\nC. Panning downward around a fighter jet\nD. Panning to the front of a fighter jet", "gt-answer": "D. Panning to the front of a fighter jet", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3396473605_reverse": { "direction": [ { "question": "In which direction do the five stars disappear?\nA. from right to left\nB. from top to bottom\nC. from left to right\nD. from bottom to top", "gt-answer": "A. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which star disappears first?\nA. the star in the center\nB. the star in the right\nC. the star in the left\nD. all stars appear at the same time", "gt-answer": "B. the star in the right", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction that the stars disappear?\nA. from right to left\nB. from left to right\nC. upwards\nD. downwards", "gt-answer": "A. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1086820415_reverse": { "direction": [ { "question": "What is the direction of motion of the large wave?\nA. moving vertically towards the top of the screen\nB. moving horizontally towards the right side of the screen\nC. moving vertically towards the bottom of the screen\nD. moving horizontally towards the left side of the screen", "gt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which direction does the large wave move in the video?\nA. vertically towards the top of the screen\nB. diagonally towards the bottom-right corner\nC. vertically towards the bottom of the screen\nD. diagonally towards the top-left corner", "gt-answer": "A. vertically towards the top of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the large wave travel across the screen?\nA. moving vertically towards the bottom\nB. contracting towards the center\nC. moving vertically towards the top\nD. expanding from the center", "gt-answer": "C. moving vertically towards the top", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1073831006_reverse": { "direction": [ { "question": "What is the direction of the zebras' movement?\nA. from right to left\nB. from left to right\nC. from top to bottom", "gt-answer": "A. from right to left", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction are the zebras moving?\nA. from left to right relative to the camera\nB. away from the camera\nC. towards the camera\nD. from right to left relative to the camera", "gt-answer": "D. from right to left relative to the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction are the zebras heading?\nA. downward\nB. leftward\nC. rightward\nD. upward", "gt-answer": "B. leftward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1024867412_reverse": { "direction": [ { "question": "What direction is the car driving?\nA. Taking a left turn\nB. Going straight\nC. Taking a right turn\nD. Going backward", "gt-answer": "A. Taking a left turn", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which direction is the car moving?\nA. Left\nB. Right\nC. Backward\nD. Forward", "gt-answer": "A. Left", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What maneuver is the car making?\nA. Making a left turn\nB. Parked on the street\nC. Driving backward\nD. Making a right turn", "gt-answer": "A. Making a left turn", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1076877854_reverse": { "direction": [ { "question": "Which direction is the closest robotic arm moving from the camera's point of view?\nA. To the right side of the screen\nB. Towards the camera\nC. Away from the camera\nD. To the left side of the screen", "gt-answer": "D. To the left side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What motion can be observed about the closest robotic arm?\nA. Rotating\nB. Moving to the left side of the screen\nC. Oscillating\nD. Moving to the right side of the screen", "gt-answer": "B. Moving to the left side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What kind of movement does the closest robotic arm exhibit?\nA. Shifting to the left side of the screen\nB. Ascending and descending\nC. Shifting to the right side of the screen\nD. Swaying back and forth", "gt-answer": "A. Shifting to the left side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1100468035_reverse": { "direction": [ { "question": "What is the direction of the camera in the video?\nA. zooming backward\nB. zooming forward\nC. tracking right\nD. panning left", "gt-answer": "A. zooming backward", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which direction is the camera moving towards?\nA. zooming backward\nB. ascending upward\nC. sliding left\nD. zooming forward", "gt-answer": "A. zooming backward", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "In what manner is the camera moving?\nA. zooming backward\nB. dollying up\nC. zooming forward\nD. tilting down", "gt-answer": "A. zooming backward", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the door?\nA. remaining closed\nB. closing\nC. gradually opening", "gt-answer": "B. closing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the door changing?\nA. by gradually opening\nB. by shrinking\nC. by staying the same\nD. by gradually closing", "gt-answer": "D. by gradually closing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What option best describes the change of the door?\nA. opening\nB. staying closed\nC. staying half-opened\nD. closing", "gt-answer": "D. closing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3411806181_reverse": { "direction": [ { "question": "Which direction is the person moving the charging gun?\nA. Away from the car\nB. Parallel to the car\nC. Towards the car", "gt-answer": "A. Away from the car", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is the person performing on the charging gun?\nA. holding it still\nB. unpluging it from the car\nC. plugging it into the car", "gt-answer": "B. unpluging it from the car", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Towards which side is the person moving the charging gun?\nA. himself\nB. the car\nC. none of both", "gt-answer": "A. himself", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1073914229_reverse": { "direction": [ { "question": "What direction are the trains moving?\nA. in the same direction\nB. towards each other\nC. away from each other", "gt-answer": "C. away from each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what manner are the trains traveling?\nA. stopped\nB. in the same direction\nC. towards each other\nD. away from each other", "gt-answer": "D. away from each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the trajectory of the trains?\nA. perpendicular to each other\nB. moving away from each other\nC. proceeding in the same way\nD. moving towards each other", "gt-answer": "B. moving away from each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1093139559_reverse": { "direction": [ { "question": "What is the type of camera motion in the video? \nA. Zooming into three football players\nB. Panning left\nC. Panning right\nD. Zooming out from three football palyers", "gt-answer": "D. Zooming out from three football palyers", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the camera moving? \nA. Zooming in\nB. Upwards\nC. Zooming out\nD. Downwards", "gt-answer": "C. Zooming out", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which option best describes the camera's motion? \nA. Tilting upwards\nB. Zooming forward\nC. Zooming backward\nD. Standing still", "gt-answer": "C. Zooming backward", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "What is happening to the light condition on the football players?\nA. staying the same\nB. turning darker\nC. turning brighter", "gt-answer": "B. turning darker", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How would you describe the change in light on the football players?\nA. dimming\nB. flickering\nC. intensifying", "gt-answer": "A. dimming", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which statement accurately describes the change on the football players?\nA. becoming blurry\nB. becoming more visible\nC. becoming dimmer", "gt-answer": "C. becoming dimmer", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1080591311_reverse": { "direction": [ { "question": "What direction is the jellyfish moving?\nA. moving towards the right\nB. floating upwards\nC. moving towards the left\nD. sinking downwards", "gt-answer": "D. sinking downwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of motion for the jellyfish?\nA. floating to the right\nB. floating to the left\nC. floating downwards\nD. floating upwards", "gt-answer": "C. floating downwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which way is the jellyfish moving?\nA. going down\nB. going away from the screen\nC. going towards the screen\nD. going up", "gt-answer": "A. going down", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "3411228673_reverse": { "direction": [ { "question": "What is the direction of the movement in the video?\nA. sideways along the skyscraper buildings\nB. upwards among skyscraper buildings\nC. downwards towards the ground", "gt-answer": "C. downwards towards the ground", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the camera moving?\nA. backwards\nB. forwards\nC. downwards\nD. upwards", "gt-answer": "C. downwards", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the path of movement in the video?\nA. flying downwards\nB. flying forwards\nC. flying backwards\nD. flying upwards", "gt-answer": "A. flying downwards", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1093737353_reverse": { "direction": [ { "question": "What type of motion is the camera performing in the video?\nA. panning to the right\nB. panning to the left\nC. tilting up\nD. zooming in", "gt-answer": "B. panning to the left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the camera moving?\nA. downwards\nB. rightwards\nC. leftwards\nD. upwards", "gt-answer": "C. leftwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the direction of the camera's movement?\nA. panning to the left\nB. panning to the right\nC. backwards\nD. forwards", "gt-answer": "A. panning to the left", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1017768724_reverse": { "direction": [ { "question": "What is the direction of the person's movement?\nA. moving upwards\nB. moving leftwards\nC. moving downwards\nD. moving rightwards", "gt-answer": "B. moving leftwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the person heading?\nA. vertically\nB. backward\nC. forward\nD. horizontally", "gt-answer": "D. horizontally", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "How is the person moving?\nA. moving rightwards\nB. jumping upwards\nC. moving leftwards\nD. running forwards", "gt-answer": "C. moving leftwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100117263_reverse": { "direction": [ { "question": "What is the direction of the little lion's motion?\nA. downward\nB. upward\nC. towards the camera\nD. rightward", "gt-answer": "B. upward", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the little lion doing?\nA. sitting nearby an adult lion\nB. sitting on the back of an adult lion\nC. falling from the back of an adult lion\nD. jumping onto the back of an adult lion", "gt-answer": "D. jumping onto the back of an adult lion", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In what direction is the little lion going?\nA. falling down\nB. climbing up\nC. walking forward\nD. walking backward", "gt-answer": "B. climbing up", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1021488277_reverse": { "direction": [ { "question": "What is happening in the video? \nA. A person drops down the pineapple\nB. A person pushes forward the pineapple\nC. A person rotates the pineapple\nD. A person picks up the pineapple", "gt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What action is taking place in the video?\nA. The pineapple is being dropped by a person.\nB. The pineapple is being rotated by a person.\nC. The pineapple is being pushed forward by a person.\nD. The pineapple is being picked up by a person.", "gt-answer": "A. The pineapple is being dropped by a person.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What can be observed in the video?\nA. The pineapple is rotated by a person.\nB. The pineapple is pushed in a forward direction.\nC. The pineapple is lifted by an individual.\nD. The pineapple is put down.", "gt-answer": "D. The pineapple is put down.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100397435_reverse": { "direction": [ { "question": "What direction is the robot vacuum cleaner moving in the video?\nA. to the right side of the screen\nB. to the left side of the screen\nC. towards the screen\nD. away from the screen", "gt-answer": "B. to the left side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the movement pattern of the robot vacuum cleaner?\nA. straight line towards the screen\nB. straight line to the right side of the screen\nC. straight line to the left side of the screen\nD. straight line away from the screen", "gt-answer": "C. straight line to the left side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Where is the robot vacuum cleaner heading?\nA. to the lower side of the screen\nB. to the upper side of the screen\nC. to the left side of the screen\nD. to the right side of the screen", "gt-answer": "C. to the left side of the screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1108534143_reverse": { "direction": [ { "question": "What is the puppy doing in the video?\nA. staying in a wigwam\nB. walking into a wigwam\nC. walking out of a wigwam", "gt-answer": "B. walking into a wigwam", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the puppy moving?\nA. walking out of a wigwam\nB. entring a wigwam\nC. walking around a wigwam", "gt-answer": "B. entring a wigwam", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is the puppy taking?\nA. entring a wigwam\nB. walking out of a wigwam\nC. walking around a wigwam", "gt-answer": "A. entring a wigwam", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1047368344_reverse": { "direction": [ { "question": "What is the girl doing?\nA. jumping into water\nB. jumping around water\nC. swimming in the water\nD. jumping out of water", "gt-answer": "D. jumping out of water", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the girl moving?\nA. towards the camera\nB. towards the water\nC. away from the water", "gt-answer": "C. away from the water", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which direction is the girl moving?\nA. towards the water\nB. away from the water\nC. inside the water", "gt-answer": "B. away from the water", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1050618460_reverse": { "attribute_change": [ { "question": "What is happening to the flowers?\nA. turning into buds\nB. shrinking and wilting\nC. turning into full bloom\nD. remaining as buds", "gt-answer": "A. turning into buds", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How do the flowers transform?\nA. from stem to leaf\nB. from full bloom to bud\nC. from seed to germination\nD. from bud to full bloom", "gt-answer": "B. from full bloom to bud", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What happens when the flowers go through the attribute_change?\nA. reaching full maturity\nB. shedding leaves\nC. sprouting more buds\nD. shrinking into buds", "gt-answer": "D. shrinking into buds", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1083113449_reverse": { "attribute_change": [ { "question": "How would you describe the change in the sky's appearance?\nA. lightening up\nB. maintaining its brightness\nC. getting darker", "gt-answer": "A. lightening up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is occurring to the sky?\nA. staying the same\nB. getting darker\nC. brightening", "gt-answer": "C. brightening", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In terms of illumination, what is happening to the sky?\nA. becoming brighter\nB. growing dimmer\nC. remaining unchanged", "gt-answer": "A. becoming brighter", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1091143117_reverse": { "attribute_change": [ { "question": "What is happening to the eye?\nA. from closed to open\nB. turning red\nC. becoming blurry\nD. from open to closed", "gt-answer": "D. from open to closed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the eye changing?\nA. changing color\nB. from closed to open\nC. becoming smaller\nD. from open to closed", "gt-answer": "D. from open to closed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What transformation is occurring in the eye?\nA. from open to closed\nB. shrinking\nC. from closed to open\nD. blinking", "gt-answer": "A. from open to closed", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1098153561_reverse": { "attribute_change": [ { "question": "What is happening to the leaves?\nA. changing shape\nB. falling off\nC. changing color from green to red\nD. changing color from red to green", "gt-answer": "D. changing color from red to green", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the initial color of the leaves?\nA. red\nB. white\nC. green", "gt-answer": "A. red", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the final color of the leaves?\nA. white\nB. red\nC. green", "gt-answer": "C. green", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1059072773_reverse": { "attribute_change": [ { "question": "What is happening to the ice cream?\nA. melting\nB. freezing\nC. evaporating\nD. solidifying", "gt-answer": "D. solidifying", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the ice cream changing?\nA. changing color\nB. being eaten out\nC. turning into liquid\nD. solidifying into a ball", "gt-answer": "D. solidifying into a ball", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which term best describes the state change of the ice cream?\nA. evaporation\nB. solidifying\nC. melting", "gt-answer": "B. solidifying", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1093573255_reverse": { "attribute_change": [ { "question": "What is happening to the plant?\nA. wilting\nB. reviving\nC. shedding leaves\nD. turning into buds", "gt-answer": "A. wilting", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the plant changing?\nA. withering away\nB. turning yellow\nC. reviving\nD. blooming", "gt-answer": "A. withering away", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what way is the plant transforming?\nA. wilting\nB. rotting\nC. reviving\nD. shedding leaves", "gt-answer": "A. wilting", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1077146132_reverse": { "attribute_change": [ { "question": "What is happening to the video?\nA. staying the same brightness\nB. turning darker\nC. turning brighter", "gt-answer": "B. turning darker", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the video change in terms of brightness?\nA. decreasing\nB. remaining constant\nC. increasing", "gt-answer": "A. decreasing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is occurring with the video's attribute?\nA. maintaining steady brightness\nB. getting brighter\nC. getting dimmer", "gt-answer": "C. getting dimmer", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086688682_reverse": { "attribute_change": [ { "question": "What change is happening to the traffic lights?\nA. From red to green\nB. From red to yellow\nC. From yellow to red\nD. From green to red", "gt-answer": "D. From green to red", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the attribute change occurring to the traffic lights?\nA. Changing color sequence\nB. Dimming brightness\nC. Switching off\nD. Blinking rapidly", "gt-answer": "A. Changing color sequence", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What alteration is taking place to the traffic lights?\nA. Transitioning from yellow to green\nB. Transitioning from green to yellow\nC. Transitioning from red to green\nD. Transitioning from green to red", "gt-answer": "D. Transitioning from green to red", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1099738787_reverse": { "attribute_change": [ { "question": "What is happening to the concrete wall?\nA. melting\nB. falling apart\nC. assembling together", "gt-answer": "C. assembling together", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the attribute change of the concrete wall?\nA. rebuilding\nB. shrinking\nC. disappearing\nD. falling apart", "gt-answer": "A. rebuilding", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "In what state is the concrete wall?\nA. expanding\nB. assembling together\nC. falling apart\nD. intact", "gt-answer": "B. assembling together", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1094219575_reverse": { "attribute_change": [ { "question": "What is happening to the flowers?\nA. growing taller\nB. changing color\nC. blooming\nD. wilting", "gt-answer": "C. blooming", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the condition of the flowers?\nA. decaying\nB. dormant\nC. budding\nD. blooming", "gt-answer": "D. blooming", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the transformation occurring to the flowers?\nA. reproducing through seeds\nB. changing from withered to full blossom\nC. changing from full blossom to withered\nD. sprouting new buds", "gt-answer": "B. changing from withered to full blossom", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1067427023_reverse": { "attribute_change": [ { "question": "Which term best describes the transformation happening to the snow particles?\nA. solidifying\nB. melting\nC. scattering", "gt-answer": "A. solidifying", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What change is occurring to the snow particles?\nA. remaining the same\nB. growing in size\nC. decreasing in size", "gt-answer": "B. growing in size", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In the given scenario, what is the primary attribute change experienced by the snow particles?\nA. freezing\nB. melting\nC. scattering", "gt-answer": "A. freezing", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1093948229_reverse": { "attribute_change": [ { "question": "What is happening to the golden particles?\nA. melting\nB. shrinking\nC. spinning\nD. exploding", "gt-answer": "B. shrinking", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which of the following best describes the change in the attribute of the golden particles?\nA. freezing\nB. exploding\nC. melting\nD. shrinking", "gt-answer": "D. shrinking", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which word below represents the transformation taking place on the golden particles?\nA. contracting\nB. melting\nC. exploding\nD. condensing", "gt-answer": "A. contracting", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1049965795_reverse": { "attribute_change": [ { "question": "What is happening to the light bulb?\nA. turning off\nB. breaking\nC. light up\nD. rapidly changing color", "gt-answer": "A. turning off", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What change occurs in the light bulb?\nA. becoming darker\nB. getting smaller\nC. light up\nD. flickering", "gt-answer": "A. becoming darker", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What alteration takes place in the light bulb?\nA. rusting\nB. turn off\nC. crackling\nD. light up", "gt-answer": "B. turn off", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1052364490_reverse": { "attribute_change": [ { "question": "What is happening to the digital bar chart?\nA. staying in the same size\nB. increasing\nC. decreasing", "gt-answer": "C. decreasing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "The digital bar chart is experiencing what kind of change?\nA. decreasing\nB. growing\nC. fluctuating", "gt-answer": "A. decreasing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What alteration is taking place to the digital bar chart?\nA. levelling out\nB. growing\nC. disappearing", "gt-answer": "C. disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1080990179_reverse": { "attribute_change": [ { "question": "What is happening to the apple?\nA. being cut\nB. shrinking and drying out\nC. growing bigger", "gt-answer": "C. growing bigger", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the apple changing?\nA. getting smaller\nB. remaining in the same shape\nC. getting bigger", "gt-answer": "C. getting bigger", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the change in the apple's attributes?\nA. swelling and becoming juicy\nB. shrinking and drying out\nC. being cut and getting smaller", "gt-answer": "A. swelling and becoming juicy", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1077575504_reverse": { "attribute_change": [ { "question": "What is happening to the pile of salt?\nA. scattering\nB. growing\nC. melting\nD. disappearing", "gt-answer": "D. disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which one of the following is an attribute change happening to the pile of salt?\nA. shrinking\nB. growing\nC. burning\nD. dissolving", "gt-answer": "A. shrinking", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "How is the pile of salt changing?\nA. melting\nB. unchanged\nC. growing bigger\nD. becoming smaller", "gt-answer": "D. becoming smaller", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "23370985_reverse": { "attribute_change": [ { "question": "What is happening to the ice crystal?\nA. freezing\nB. melting\nC. shattering", "gt-answer": "B. melting", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What process is occurring with the ice crystal?\nA. reducing in size\nB. turning into water\nC. growing in size\nD. remaining the same", "gt-answer": "A. reducing in size", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What transformation is taking place in the ice crystal?\nA. cracking\nB. unchanged\nC. melting\nD. forming", "gt-answer": "C. melting", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055981522_reverse": { "attribute_change": [ { "question": "What is happening to the 3d shapes?\nA. disappearing\nB. turning into triangles\nC. turning into spheres\nD. turning into cubes", "gt-answer": "D. turning into cubes", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the attribute change of the 3d shapes?\nA. transforming from cubes into spheres\nB. transforming from spheres into cubes\nC. remaining as cubes\nD. remaining as spheres", "gt-answer": "B. transforming from spheres into cubes", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which shape are the 3d shapes transforming into?\nA. cubes\nB. triangles\nC. spheres\nD. pentagons", "gt-answer": "A. cubes", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1081734740_reverse": { "attribute_change": [ { "question": "What is happening to the texture of the leaf?\nA. It is turning from green to yellow\nB. It is turning from white to green\nC. It is turning from green to white\nD. It is turning from yellow to green", "gt-answer": "D. It is turning from yellow to green", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What color is the leaf turning into?\nA. White\nB. Green\nC. Yellow", "gt-answer": "B. Green", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What change is occurring in the leaf?\nA. It is getting smaller\nB. It is becoming white\nC. It is becoming yellow\nD. It is becoming green", "gt-answer": "D. It is becoming green", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1093719871_reverse": { "attribute_change": [ { "question": "What is happening to the pink flowers?\nA. growing taller\nB. falling off petals\nC. turning from withered to full blossom\nD. turning from full blossom to withered", "gt-answer": "D. turning from full blossom to withered", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "How are the pink flowers transforming?\nA. from small buds to big flowers\nB. from full blossom to withered\nC. from half-open to closed\nD. from withered to full blossom", "gt-answer": "B. from full blossom to withered", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the final appearance of the pink flowers?\nA. small buds\nB. died petals\nC. fresh leaves\nD. fully bloomed", "gt-answer": "B. died petals", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1055973887_reverse": { "attribute_change": [ { "question": "What is happening to the fire ball? \nA. staying the same size\nB. getting smaller\nC. getting larger", "gt-answer": "B. getting smaller", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "How is the fire ball changing? \nA. splitting in half\nB. expanding out\nC. contracting into the center", "gt-answer": "C. contracting into the center", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In what way is the fire ball transforming? \nA. changing into a cube size\nB. shrinking in size\nC. growing in size", "gt-answer": "B. shrinking in size", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1098710341_reverse": { "attribute_change": [ { "question": "What is happening to the glass?\nA. It is changing color\nB. It is going from full of water to empty\nC. It is going from empty to full of water\nD. It is transforming into a different shape", "gt-answer": "B. It is going from full of water to empty", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the final state of the glass?\nA. It is broken into pieces\nB. It is about 70% full with water\nC. It is half full with water\nD. It is empty", "gt-answer": "D. It is empty", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In whay way is the glass changing?\nA. Water was disappearing from the glass\nB. The glass was heated\nC. Water was poured into the glass\nD. A chemical reaction occurred in the glass", "gt-answer": "A. Water was disappearing from the glass", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1099116143_reverse": { "attribute_change": [ { "question": "What is happening to the pink liquid?\nA. White foam disappears from the surface\nB. White foam appears on the surface\nC. It is freezing\nD. It is evaporating", "gt-answer": "A. White foam disappears from the surface", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What can be observed visually on the pink liquid?\nA. White foam appears on the surface\nB. The liquid is turning transparent\nC. White foam disappears from the surface", "gt-answer": "C. White foam disappears from the surface", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the appearance of the pink liquid affected?\nA. White foam appears on the surface\nB. It becomes blue\nC. White foam disappears from the surface\nD. It becomes green", "gt-answer": "C. White foam disappears from the surface", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1025623079_reverse": { "attribute_change": [ { "question": "What is happening to the skyscraper?\nA. lighting up\nB. growing taller\nC. in construction\nD. collapsing", "gt-answer": "B. growing taller", "video-llm-prediction": "D", "match_success": true, "rating": 0 }, { "question": "What is the condition of the skyscraper?\nA. in construction\nB. collapsing\nC. being eracted\nD. burning in fire", "gt-answer": "C. being eracted", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What change is occurring with the skyscraper?\nA. burning in fire\nB. collapsing\nC. standing up\nD. turning darker", "gt-answer": "C. standing up", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1063373449_reverse": { "attribute_change": [ { "question": "What is happening to the coronavirus?\nA. replicating itself\nB. mutating into a new strain\nC. assembling together\nD. dissolving under the attack of antibodies", "gt-answer": "C. assembling together", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the coronavirus responding to antibodies?\nA. replicating itself\nB. dissolving under their attack\nC. avoiding them by hiding in cells\nD. assembling together", "gt-answer": "D. assembling together", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What occurs to the coronavirus?\nA. it assembles together\nB. it grows larger\nC. it dissolves\nD. it replicates", "gt-answer": "A. it assembles together", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1062609286_reverse": { "attribute_change": [ { "question": "What is happening to the battery charge?\nA. decreasing\nB. staying constant\nC. increasing", "gt-answer": "A. decreasing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the battery charge changing?\nA. increasing\nB. random\nC. decreasing", "gt-answer": "C. decreasing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which option describes the change of the battery charge?\nA. decreasing\nB. increasing\nC. staying the same", "gt-answer": "A. decreasing", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1060403198_reverse": { "attribute_change": [ { "question": "What is happening to the tree?\nA. increasing height\nB. decreasing height\nC. shedding leaves\nD. changing color", "gt-answer": "B. decreasing height", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which attribute of the tree is undergoing a transformation?\nA. position\nB. height\nC. color", "gt-answer": "B. height", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What term can be used to describe the change happening to the tree?\nA. wilting\nB. growing in size\nC. falling down\nD. reducing in size", "gt-answer": "D. reducing in size", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1099109715_reverse": { "attribute_change": [ { "question": "What is happening to the number of fruits and vegetables?\nA. becoming rotten\nB. increasing\nC. decreasing\nD. staying the same", "gt-answer": "C. decreasing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the change to the fruits and vegetables?\nA. disappearing\nB. increasing number\nC. staying the same\nD. decaying", "gt-answer": "A. disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which is the most accurate statement about the number of fruits and vegetables?\nA. It is getting bigger.\nB. It is getting smaller.\nC. It is changing sporadically.\nD. It is remaining constant.", "gt-answer": "B. It is getting smaller.", "video-llm-prediction": "D", "match_success": true, "rating": 0 } ] }, "1051211272_reverse": { "attribute_change": [ { "question": "What is happening to the toast with cream cheese?\nA. gradually reappearing piece by piece\nB. staying the same size\nC. gradually being eaten out and disappearing", "gt-answer": "A. gradually reappearing piece by piece", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What alteration is taking place with the cream cheese-covered toast?\nA. Gradually emerging piece by piece\nB. Remaining constant in size\nC. Slowly diminishing as it is consumed", "gt-answer": "A. Gradually emerging piece by piece", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the outcome of the toast with cream cheese?\nA. it gradually reappears piece by piece\nB. it gradually disappears piece by piece\nC. it gradually spoils", "gt-answer": "A. it gradually reappears piece by piece", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1059815936_reverse": { "attribute_change": [ { "question": "What is happening to the paper?\nA. changing from a wrinkled paper ball into a flattened sheet\nB. changing from a flattened sheet into scraps of paper\nC. changing from a flattened sheet into a wrinkled paper ball", "gt-answer": "C. changing from a flattened sheet into a wrinkled paper ball", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the paper transform?\nA. crumpling into a ball\nB. tearing apart\nC. unfolding", "gt-answer": "A. crumpling into a ball", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the main change occurring in the paper?\nA. changing teared apart\nB. being folded\nC. being flattened out", "gt-answer": "B. being folded", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1059718130_concat_0": { "speed": [ { "question": "What is the speed of the sun above?\nA. rising slower than the sun below\nB. rising faster than the sun below\nC. rising at the same speed as the sun below", "gt-answer": "C. rising at the same speed as the sun below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which sun is rising faster?\nA. the sun below\nB. Both suns are rising at the same speed\nC. the sun above", "gt-answer": "B. Both suns are rising at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the sun above compare to the speed of the sun below?\nA. The sun above is rising slower than the sun below\nB. The sun above and the sun below have the same speed\nC. The sun above is rising faster than the sun below", "gt-answer": "B. The sun above and the sun below have the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059718130_concat_1": { "speed": [ { "question": "What is the speed of the sun above?\nA. rising faster than the sun below\nB. rising slower than the sun below\nC. rising at the same speed as the sun below", "gt-answer": "B. rising slower than the sun below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which sun is rising faster?\nA. the sun above\nB. Both suns are rising at the same speed\nC. the sun below", "gt-answer": "C. the sun below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the sun above compare to the speed of the sun below?\nA. The sun above is rising faster than the sun below\nB. The sun above and the sun below have the same speed\nC. The sun above is rising slower than the sun below", "gt-answer": "C. The sun above is rising slower than the sun below", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059718130_concat_2": { "speed": [ { "question": "What is the speed of the sun above?\nA. rising at the same speed as the sun below\nB. rising slower than the sun below\nC. rising faster than the sun below", "gt-answer": "C. rising faster than the sun below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which sun is rising faster?\nA. Both suns are rising at the same speed\nB. the sun below\nC. the sun above", "gt-answer": "C. the sun above", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the sun above compare to the speed of the sun below?\nA. The sun above is rising slower than the sun below\nB. The sun above and the sun below have the same speed\nC. The sun above is rising faster than the sun below", "gt-answer": "C. The sun above is rising faster than the sun below", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1098153561_concat_0": { "speed": [ { "question": "What is the speed that the forest above changing color?\nA. faster than the forest below\nB. at the same speed as the forest below\nC. slower than the forest below", "gt-answer": "B. at the same speed as the forest below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the forest above compare to the forest below?\nA. it changes color at the same speed as the forest below\nB. it changes color slower than the forest below\nC. it changes color faster than the forest below", "gt-answer": "A. it changes color at the same speed as the forest below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In relation to the speed of the forest below, how does the speed of color change in the forest above appear?\nA. Faster\nB. Slower\nC. Equally fast", "gt-answer": "C. Equally fast", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1098153561_concat_1": { "speed": [ { "question": "What is the speed that the forest above changing color?\nA. slower than the forest below\nB. faster than the forest below\nC. at the same speed as the forest below", "gt-answer": "A. slower than the forest below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the speed of the forest above compare to the forest below?\nA. it changes color faster than the forest below\nB. it changes color at the same speed as the forest below\nC. it changes color slower than the forest below", "gt-answer": "C. it changes color slower than the forest below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the speed of the forest below, how does the speed of color change in the forest above appear?\nA. Faster\nB. Slower\nC. Equally fast", "gt-answer": "B. Slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1098153561_concat_2": { "speed": [ { "question": "What is the speed that the forest above changing color?\nA. faster than the forest below\nB. slower than the forest below\nC. at the same speed as the forest below", "gt-answer": "A. faster than the forest below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the speed of the forest above compare to the forest below?\nA. it changes color at the same speed as the forest below\nB. it changes color faster than the forest below\nC. it changes color slower than the forest below", "gt-answer": "B. it changes color faster than the forest below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the speed of the forest below, how does the speed of color change in the forest above appear?\nA. Faster\nB. Slower\nC. Equally fast", "gt-answer": "A. Faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1059462749_concat_0": { "speed": [ { "question": "How is the person above climbing compared to the person below?\nA. Climbing faster than the person below\nB. Climbing slower than the person below\nC. Climbing at the same speed as the person below", "gt-answer": "C. Climbing at the same speed as the person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be said about the speed of the person above and the person below?\nA. The person above is moving faster than the person below\nB. The person above and below are moving at the same speed\nC. The person above is moving slower than the person below", "gt-answer": "B. The person above and below are moving at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the speed of the person above compared to the person below?\nA. climbing faster\nB. climbing at the same speed\nC. climbing slower", "gt-answer": "B. climbing at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059462749_concat_1": { "speed": [ { "question": "How is the person above climbing compared to the person below?\nA. Climbing slower than the person below\nB. Climbing faster than the person below\nC. Climbing at the same speed as the person below", "gt-answer": "A. Climbing slower than the person below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What can be said about the speed of the person above and the person below?\nA. The person above is moving faster than the person below\nB. The person above and below are moving at the same speed\nC. The person above is moving slower than the person below", "gt-answer": "C. The person above is moving slower than the person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the speed of the person above compared to the person below?\nA. climbing at the same speed\nB. climbing slower\nC. climbing faster", "gt-answer": "B. climbing slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059462749_concat_2": { "speed": [ { "question": "How is the person above climbing compared to the person below?\nA. Climbing at the same speed as the person below\nB. Climbing faster than the person below\nC. Climbing slower than the person below", "gt-answer": "B. Climbing faster than the person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be said about the speed of the person above and the person below?\nA. The person above is moving faster than the person below\nB. The person above is moving slower than the person below\nC. The person above and below are moving at the same speed", "gt-answer": "A. The person above is moving faster than the person below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the speed of the person above compared to the person below?\nA. climbing faster\nB. climbing at the same speed\nC. climbing slower", "gt-answer": "A. climbing faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1059072773_concat_0": { "speed": [ { "question": "What is the speed of the ice cream above?\nA. melting at the same speed as the ice cream below\nB. melting faster than the ice cream below\nC. melting slower than the ice cream below", "gt-answer": "A. melting at the same speed as the ice cream below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the melting speed of the ice cream above compare to the ice cream below?\nA. melting slower\nB. melting faster\nC. at the same speed", "gt-answer": "C. at the same speed", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In comparison, how would you describe the speed of melting of the ice creams?\nA. The ice cream above is melting slower than the ice cream below.\nB. The ice cream above is melting faster than the ice cream below.\nC. The ice cream above is melting at the same speed as the ice cream below.", "gt-answer": "C. The ice cream above is melting at the same speed as the ice cream below.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059072773_concat_1": { "speed": [ { "question": "What is the speed of the ice cream above?\nA. melting slower than the ice cream below\nB. melting faster than the ice cream below\nC. melting at the same speed as the ice cream below", "gt-answer": "A. melting slower than the ice cream below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the melting speed of the ice cream above compare to the ice cream below?\nA. melting faster\nB. at the same speed\nC. melting slower", "gt-answer": "C. melting slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In comparison, how would you describe the speed of melting of the ice creams?\nA. The ice cream above is melting at the same speed as the ice cream below.\nB. The ice cream above is melting faster than the ice cream below.\nC. The ice cream above is melting slower than the ice cream below.", "gt-answer": "C. The ice cream above is melting slower than the ice cream below.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1059072773_concat_2": { "speed": [ { "question": "What is the speed of the ice cream above?\nA. melting at the same speed as the ice cream below\nB. melting faster than the ice cream below\nC. melting slower than the ice cream below", "gt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the melting speed of the ice cream above compare to the ice cream below?\nA. melting slower\nB. at the same speed\nC. melting faster", "gt-answer": "C. melting faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In comparison, how would you describe the speed of melting of the ice creams?\nA. The ice cream above is melting slower than the ice cream below.\nB. The ice cream above is melting at the same speed as the ice cream below.\nC. The ice cream above is melting faster than the ice cream below.", "gt-answer": "C. The ice cream above is melting faster than the ice cream below.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1090578917_concat_0": { "speed": [ { "question": "What speed is the man above jumping at?\nA. Jumping at the same speed as the man below\nB. Slower than the man below\nC. Faster than the man below", "gt-answer": "A. Jumping at the same speed as the man below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In comparison to the man below, how does the speed of the man above jumping look?\nA. Slower speed\nB. The same speed\nC. Faster speed", "gt-answer": "B. The same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which man is jumping slower than the other?\nA. The man below\nB. The man above\nC. Both man jumping at the same speed", "gt-answer": "C. Both man jumping at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1090578917_concat_1": { "speed": [ { "question": "What speed is the man above jumping at?\nA. Jumping at the same speed as the man below\nB. Slower than the man below\nC. Faster than the man below", "gt-answer": "B. Slower than the man below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In comparison to the man below, how does the speed of the man above jumping look?\nA. Faster speed\nB. The same speed\nC. Slower speed", "gt-answer": "C. Slower speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which man is jumping slower than the other?\nA. The man below\nB. The man above\nC. Both man jumping at the same speed", "gt-answer": "B. The man above", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1090578917_concat_2": { "speed": [ { "question": "What speed is the man above jumping at?\nA. Jumping at the same speed as the man below\nB. Faster than the man below\nC. Slower than the man below", "gt-answer": "B. Faster than the man below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In comparison to the man below, how does the speed of the man above jumping look?\nA. Slower speed\nB. Faster speed\nC. The same speed", "gt-answer": "B. Faster speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which man is jumping slower than the other?\nA. Both man jumping at the same speed\nB. The man below\nC. The man above", "gt-answer": "B. The man below", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1075338140_concat_0": { "speed": [ { "question": "What is the speed of the ball above?\nA. faster than the ball below\nB. slower than the ball below\nC. moving at the same speed as the ball below", "gt-answer": "C. moving at the same speed as the ball below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which ball is moving faster?\nA. the ball below\nB. the ball above\nC. same speed", "gt-answer": "C. same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Compared to the ball below, how would you describe the speed of the ball above?\nA. slower\nB. faster\nC. same", "gt-answer": "C. same", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1075338140_concat_1": { "speed": [ { "question": "What is the speed of the ball above?\nA. faster than the ball below\nB. moving at the same speed as the ball below\nC. slower than the ball below", "gt-answer": "C. slower than the ball below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which ball is moving faster?\nA. same speed\nB. the ball above\nC. the ball below", "gt-answer": "C. the ball below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Compared to the ball below, how would you describe the speed of the ball above?\nA. slower\nB. same\nC. faster", "gt-answer": "A. slower", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1075338140_concat_2": { "speed": [ { "question": "What is the speed of the ball above?\nA. moving at the same speed as the ball below\nB. faster than the ball below\nC. slower than the ball below", "gt-answer": "B. faster than the ball below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which ball is moving faster?\nA. same speed\nB. the ball below\nC. the ball above", "gt-answer": "C. the ball above", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Compared to the ball below, how would you describe the speed of the ball above?\nA. same\nB. slower\nC. faster", "gt-answer": "C. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077575504_concat_0": { "speed": [ { "question": "What is the speed of the pile of salt above?\nA. growing at the same speed as the pile of salt below\nB. growing at a faster speed than the pile of salt below\nC. growing at a slower speed than the pile of salt below", "gt-answer": "A. growing at the same speed as the pile of salt below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In comparison to the pile of salt below, how fast is the pile of salt above growing?\nA. faster\nB. slower\nC. at an equal pace", "gt-answer": "C. at an equal pace", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the speed of the pile of salt above compared to the pile of salt below?\nA. Growing faster\nB. Growing at the same rate\nC. Growing slower", "gt-answer": "B. Growing at the same rate", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077575504_concat_1": { "speed": [ { "question": "What is the speed of the pile of salt above?\nA. growing at a faster speed than the pile of salt below\nB. growing at a slower speed than the pile of salt below\nC. growing at the same speed as the pile of salt below", "gt-answer": "B. growing at a slower speed than the pile of salt below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In comparison to the pile of salt below, how fast is the pile of salt above growing?\nA. faster\nB. at an equal pace\nC. slower", "gt-answer": "C. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the speed of the pile of salt above compared to the pile of salt below?\nA. Growing faster\nB. Growing slower\nC. Growing at the same rate", "gt-answer": "B. Growing slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077575504_concat_2": { "speed": [ { "question": "What is the speed of the pile of salt above?\nA. growing at the same speed as the pile of salt below\nB. growing at a slower speed than the pile of salt below\nC. growing at a faster speed than the pile of salt below", "gt-answer": "C. growing at a faster speed than the pile of salt below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In comparison to the pile of salt below, how fast is the pile of salt above growing?\nA. faster\nB. at an equal pace\nC. slower", "gt-answer": "A. faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How would you describe the speed of the pile of salt above compared to the pile of salt below?\nA. Growing slower\nB. Growing at the same rate\nC. Growing faster", "gt-answer": "C. Growing faster", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1100319395_concat_0": { "speed": [ { "question": "What is the speed of the white circle above?\nA. faster than the white circle below\nB. slower than the white circle below\nC. rotating at the same speed as the white circle below", "gt-answer": "C. rotating at the same speed as the white circle below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Is the white circle above rotating at a different speed from the white circle below?\nA. Yes, it's rotating faster\nB. No, it's rotating slower\nC. No, it's rotating at the same speed", "gt-answer": "C. No, it's rotating at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Compared to the white circle below, how fast is the rotation of the white circle above?\nA. It rotates at the same speed\nB. It's slower\nC. It's faster", "gt-answer": "A. It rotates at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1100319395_concat_1": { "speed": [ { "question": "What is the speed of the white circle above?\nA. faster than the white circle below\nB. rotating at the same speed as the white circle below\nC. slower than the white circle below", "gt-answer": "A. faster than the white circle below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Is the white circle above rotating at a different speed from the white circle below?\nA. No, it's rotating at the same speed\nB. Yes, it's rotating faster\nC. No, it's rotating slower", "gt-answer": "B. Yes, it's rotating faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Compared to the white circle below, how fast is the rotation of the white circle above?\nA. It rotates at the same speed\nB. It's slower\nC. It's faster", "gt-answer": "C. It's faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100319395_concat_2": { "speed": [ { "question": "What is the speed of the white circle above?\nA. slower than the white circle below\nB. rotating at the same speed as the white circle below\nC. faster than the white circle below", "gt-answer": "A. slower than the white circle below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Is the white circle above rotating at a different speed from the white circle below?\nA. No, it's rotating at the same speed\nB. Yes, it's rotating faster\nC. Yes, it's rotating slower", "gt-answer": "C. Yes, it's rotating slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Compared to the white circle below, how fast is the rotation of the white circle above?\nA. It's faster\nB. It rotates at the same speed\nC. It's slower", "gt-answer": "C. It's slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086820415_concat_0": { "speed": [ { "question": "How is the speed of the wave above compared to the wave below?\nA. Moving at the same speed as the wave below\nB. Moving faster than the wave below\nC. Moving slower than the wave below", "gt-answer": "A. Moving at the same speed as the wave below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which wave is moving faster, the wave above or the wave below?\nA. The wave below\nB. Both waves are moving at the same speed\nC. The wave above", "gt-answer": "B. Both waves are moving at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Is the speed of the wave above greater, lesser, or equal to the speed of the wave below?\nA. Lesser\nB. Equal\nC. Greater", "gt-answer": "B. Equal", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086820415_concat_1": { "speed": [ { "question": "How is the speed of the wave above compared to the wave below?\nA. Moving faster than the wave below\nB. Moving slower than the wave below\nC. Moving at the same speed as the wave below", "gt-answer": "A. Moving faster than the wave below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which wave is moving faster, the wave above or the wave below?\nA. The wave below\nB. Both waves are moving at the same speed\nC. The wave above", "gt-answer": "C. The wave above", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Is the speed of the wave above greater, lesser, or equal to the speed of the wave below?\nA. Equal\nB. Lesser\nC. Greater", "gt-answer": "C. Greater", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086820415_concat_2": { "speed": [ { "question": "How is the speed of the wave above compared to the wave below?\nA. Moving at the same speed as the wave below\nB. Moving slower than the wave below\nC. Moving faster than the wave below", "gt-answer": "B. Moving slower than the wave below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which wave is moving faster, the wave above or the wave below?\nA. The wave above\nB. The wave below\nC. Both waves are moving at the same speed", "gt-answer": "B. The wave below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Is the speed of the wave above greater, lesser, or equal to the speed of the wave below?\nA. Equal\nB. Lesser\nC. Greater", "gt-answer": "B. Lesser", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1096238125_concat_0": { "speed": [ { "question": "What is the speed of the two people above lifting the kettlebell?\nA. slower than the two people below\nB. faster than the two people below\nC. at the same speed as the two people below", "gt-answer": "C. at the same speed as the two people below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the two people above lifting the kettlebell moving in relation to the two people below?\nA. at the same speed\nB. faster\nC. slower", "gt-answer": "A. at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Relative to the two people below, how fast are the two people above lifting the kettlebell moving?\nA. faster\nB. at the same speed\nC. slower", "gt-answer": "B. at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1096238125_concat_1": { "speed": [ { "question": "What is the speed of the two people above lifting the kettlebell?\nA. slower than the two people below\nB. at the same speed as the two people below\nC. faster than the two people below", "gt-answer": "C. faster than the two people below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the two people above lifting the kettlebell moving in relation to the two people below?\nA. slower\nB. faster\nC. at the same speed", "gt-answer": "B. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Relative to the two people below, how fast are the two people above lifting the kettlebell moving?\nA. slower\nB. faster\nC. at the same speed", "gt-answer": "B. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1096238125_concat_2": { "speed": [ { "question": "What is the speed of the two people above lifting the kettlebell?\nA. at the same speed as the two people below\nB. slower than the two people below\nC. faster than the two people below", "gt-answer": "B. slower than the two people below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the two people above lifting the kettlebell moving in relation to the two people below?\nA. at the same speed\nB. slower\nC. faster", "gt-answer": "B. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Relative to the two people below, how fast are the two people above lifting the kettlebell moving?\nA. at the same speed\nB. slower\nC. faster", "gt-answer": "B. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1056433484_concat_0": { "speed": [ { "question": "What is the speed of the earth above?\nA. slower than the earth below\nB. rotates at the same speed as the earth below\nC. faster than the earth below", "gt-answer": "B. rotates at the same speed as the earth below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the earth above compare to the speed of the earth below?\nA. It is slower.\nB. It is faster.\nC. It is the same.", "gt-answer": "C. It is the same.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which statement accurately describes the speed of the earth above?\nA. It rotates faster than the earth below.\nB. It rotates slower than the earth below.\nC. It rotates at the same speed as the earth below.", "gt-answer": "C. It rotates at the same speed as the earth below.", "video-llm-prediction": "A. It rotates faster than the earth below.", "match_success": true, "rating": 0 } ] }, "1056433484_concat_1": { "speed": [ { "question": "What is the speed of the earth above?\nA. faster than the earth below\nB. rotates at the same speed as the earth below\nC. slower than the earth below", "gt-answer": "C. slower than the earth below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the earth above compare to the speed of the earth below?\nA. It is slower.\nB. It is the same.\nC. It is faster.", "gt-answer": "A. It is slower.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which statement accurately describes the speed of the earth above?\nA. It rotates faster than the earth below.\nB. It rotates slower than the earth below.\nC. It rotates at the same speed as the earth below.", "gt-answer": "B. It rotates slower than the earth below.", "video-llm-prediction": "A. It rotates faster than the earth below.", "match_success": true, "rating": 0 } ] }, "1056433484_concat_2": { "speed": [ { "question": "What is the speed of the earth above?\nA. faster than the earth below\nB. rotates at the same speed as the earth below\nC. slower than the earth below", "gt-answer": "A. faster than the earth below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the speed of the earth above compare to the speed of the earth below?\nA. It is slower.\nB. It is faster.\nC. It is the same.", "gt-answer": "B. It is faster.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which statement accurately describes the speed of the earth above?\nA. It rotates at the same speed as the earth below.\nB. It rotates faster than the earth below.\nC. It rotates slower than the earth below.", "gt-answer": "B. It rotates faster than the earth below.", "video-llm-prediction": "A. It rotates at the same speed as the earth below.", "match_success": true, "rating": 0 } ] }, "15695290_concat_0": { "speed": [ { "question": "What is the speed of the person above when drawing a picture?\nA. faster than the person below\nB. at the same speed as the person below\nC. slower than the person below", "gt-answer": "B. at the same speed as the person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Comparing the speeds, how does the person above draw a picture compared to the person below?\nA. more slowly\nB. at an equal speed\nC. more rapidly", "gt-answer": "B. at an equal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the comparison of the speed of drawing, who is considered as faster?\nA. They draw at an equal rate\nB. The person below\nC. The person above", "gt-answer": "A. They draw at an equal rate", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "15695290_concat_1": { "speed": [ { "question": "What is the speed of the person above when drawing a picture?\nA. faster than the person below\nB. at the same speed as the person below\nC. slower than the person below", "gt-answer": "C. slower than the person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Comparing the speeds, how does the person above draw a picture compared to the person below?\nA. more rapidly\nB. at an equal speed\nC. more slowly", "gt-answer": "C. more slowly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the comparison of the speed of drawing, who is considered as faster?\nA. The person above\nB. They draw at an equal rate\nC. The person below", "gt-answer": "C. The person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "15695290_concat_2": { "speed": [ { "question": "What is the speed of the person above when drawing a picture?\nA. slower than the person below\nB. at the same speed as the person below\nC. faster than the person below", "gt-answer": "C. faster than the person below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Comparing the speeds, how does the person above draw a picture compared to the person below?\nA. at an equal speed\nB. more rapidly\nC. more slowly", "gt-answer": "B. more rapidly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the comparison of the speed of drawing, who is considered as faster?\nA. The person below\nB. They draw at an equal rate\nC. The person above", "gt-answer": "C. The person above", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1047368344_concat_0": { "speed": [ { "question": "What is the speed of the girl above?\nA. running at the same speed as the girl below\nB. running slower than the girl below\nC. running faster than the girl below", "gt-answer": "A. running at the same speed as the girl below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the speed of the girl above compare to the girl below?\nA. the same\nB. slower\nC. faster", "gt-answer": "A. the same", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How would you describe the speed of the girl above relative to the girl below?\nA. faster\nB. the same speed\nC. slower", "gt-answer": "B. the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1047368344_concat_1": { "speed": [ { "question": "What is the speed of the girl above?\nA. running slower than the girl below\nB. running at the same speed as the girl below\nC. running faster than the girl below", "gt-answer": "A. running slower than the girl below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the speed of the girl above compare to the girl below?\nA. faster\nB. slower\nC. the same", "gt-answer": "B. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the speed of the girl above relative to the girl below?\nA. slower\nB. faster\nC. the same speed", "gt-answer": "A. slower", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1047368344_concat_2": { "speed": [ { "question": "What is the speed of the girl above?\nA. running at the same speed as the girl below\nB. running slower than the girl below\nC. running faster than the girl below", "gt-answer": "C. running faster than the girl below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the girl above compare to the girl below?\nA. the same\nB. faster\nC. slower", "gt-answer": "B. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the speed of the girl above relative to the girl below?\nA. slower\nB. the same speed\nC. faster", "gt-answer": "C. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1060403198_concat_0": { "speed": [ { "question": "What is the speed of the tree above?\nA. growing slower than the tree below\nB. growing faster than the tree below\nC. growing at the same speed as the tree below", "gt-answer": "C. growing at the same speed as the tree below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the tree above grow compare to the tree below?\nA. slower\nB. at the same speed\nC. faster", "gt-answer": "B. at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which tree is growing at a higher speed - the tree above or the tree below?\nA. both trees grow at an equal speed\nB. the tree above\nC. the tree below", "gt-answer": "A. both trees grow at an equal speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1060403198_concat_1": { "speed": [ { "question": "What is the speed of the tree above?\nA. growing at the same speed as the tree below\nB. growing slower than the tree below\nC. growing faster than the tree below", "gt-answer": "C. growing faster than the tree below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the tree above grow compare to the tree below?\nA. faster\nB. at the same speed\nC. slower", "gt-answer": "A. faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which tree is growing at a higher speed - the tree above or the tree below?\nA. both trees grow at an equal speed\nB. the tree above\nC. the tree below", "gt-answer": "B. the tree above", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1060403198_concat_2": { "speed": [ { "question": "What is the speed of the tree above?\nA. growing faster than the tree below\nB. growing at the same speed as the tree below\nC. growing slower than the tree below", "gt-answer": "C. growing slower than the tree below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the tree above grow compare to the tree below?\nA. slower\nB. at the same speed\nC. faster", "gt-answer": "A. slower", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which tree is growing at a higher speed - the tree above or the tree below?\nA. the tree below\nB. both trees grow at an equal speed\nC. the tree above", "gt-answer": "A. the tree below", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1100058499_concat_0": { "speed": [ { "question": "What is the speed of the man above compared to the man below?\nA. jumping rope faster\nB. jumping rope at the same speed\nC. jumping rope slower", "gt-answer": "B. jumping rope at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the man above jump rope, relative to the man below?\nA. the same speed\nB. slower\nC. faster", "gt-answer": "A. the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which man is jumping rope at a slower speed?\nA. the man above\nB. both are jumping rope at the same speed\nC. the man below", "gt-answer": "B. both are jumping rope at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1100058499_concat_1": { "speed": [ { "question": "What is the speed of the man above compared to the man below?\nA. jumping rope faster\nB. jumping rope slower\nC. jumping rope at the same speed", "gt-answer": "B. jumping rope slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the man above jump rope, relative to the man below?\nA. the same speed\nB. slower\nC. faster", "gt-answer": "B. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which man is jumping rope at a slower speed?\nA. the man above\nB. the man below\nC. both are jumping rope at the same speed", "gt-answer": "A. the man above", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1100058499_concat_2": { "speed": [ { "question": "What is the speed of the man above compared to the man below?\nA. jumping rope faster\nB. jumping rope slower\nC. jumping rope at the same speed", "gt-answer": "A. jumping rope faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the man above jump rope, relative to the man below?\nA. the same speed\nB. slower\nC. faster", "gt-answer": "C. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which man is jumping rope at a slower speed?\nA. the man above\nB. the man below\nC. both are jumping rope at the same speed", "gt-answer": "B. the man below", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1092813279_concat_0": { "speed": [ { "question": "Which woman is doing push ups slower?\nA. the woman below\nB. two women doing push ups at the same speed\nC. the woman above", "gt-answer": "B. two women doing push ups at the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the speed of the woman above's push ups compared to the woman below?\nA. same speed\nB. faster\nC. slower", "gt-answer": "A. same speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Compared to the woman below, how would you describe the speed of the woman above's push ups?\nA. same speed\nB. faster\nC. slower", "gt-answer": "A. same speed", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1092813279_concat_1": { "speed": [ { "question": "Which woman is doing push ups slower?\nA. the woman below\nB. the woman above\nC. two women doing push ups at the same speed", "gt-answer": "B. the woman above", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the speed of the woman above's push ups compared to the woman below?\nA. faster\nB. slower\nC. same speed", "gt-answer": "B. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Compared to the woman below, how would you describe the speed of the woman above's push ups?\nA. faster\nB. same speed\nC. slower", "gt-answer": "C. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1092813279_concat_2": { "speed": [ { "question": "Which woman is doing push ups slower?\nA. the woman above\nB. two women doing push ups at the same speed\nC. the woman below", "gt-answer": "C. the woman below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the speed of the woman above's push ups compared to the woman below?\nA. same speed\nB. faster\nC. slower", "gt-answer": "B. faster", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Compared to the woman below, how would you describe the speed of the woman above's push ups?\nA. faster\nB. same speed\nC. slower", "gt-answer": "A. faster", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1084518106_concat_0": { "speed": [ { "question": "What is the speed of the truck above?\nA. driving at the same speed as the truck below\nB. driving faster than the truck below\nC. driving slower than the truck below", "gt-answer": "A. driving at the same speed as the truck below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How does the speed of the truck above compare to the truck below?\nA. the same speed\nB. slower\nC. faster", "gt-answer": "A. the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which truck is moving at a higher speed?\nA. the truck above\nB. the truck below\nC. they move a the same speed", "gt-answer": "C. they move a the same speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1084518106_concat_1": { "speed": [ { "question": "What is the speed of the truck above?\nA. driving slower than the truck below\nB. driving faster than the truck below\nC. driving at the same speed as the truck below", "gt-answer": "B. driving faster than the truck below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the truck above compare to the truck below?\nA. faster\nB. the same speed\nC. slower", "gt-answer": "A. faster", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which truck is moving at a higher speed?\nA. the truck below\nB. they move a the same speed\nC. the truck above", "gt-answer": "C. the truck above", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1084518106_concat_2": { "speed": [ { "question": "What is the speed of the truck above?\nA. driving faster than the truck below\nB. driving slower than the truck below\nC. driving at the same speed as the truck below", "gt-answer": "B. driving slower than the truck below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the speed of the truck above compare to the truck below?\nA. the same speed\nB. faster\nC. slower", "gt-answer": "C. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which truck is moving at a higher speed?\nA. the truck above\nB. the truck below\nC. they move a the same speed", "gt-answer": "B. the truck below", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1062609286_concat_0": { "speed": [ { "question": "What is happening to the battery charge above?\nA. increasing at a slower speed than the battery charge below\nB. increasing at a faster speed than the battery charge below\nC. increasing at the same speed as the battery charge below", "gt-answer": "C. increasing at the same speed as the battery charge below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be said about the speed at which the battery charge above is increasing?\nA. faster than the battery charge below\nB. slower than the battery charge below\nC. at an equal speed as the battery charge below", "gt-answer": "C. at an equal speed as the battery charge below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the charging speed below, how is the charging speed above?\nA. faster\nB. slower\nC. the same", "gt-answer": "C. the same", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1062609286_concat_1": { "speed": [ { "question": "What is happening to the battery charge above?\nA. increasing at a faster speed than the battery charge below\nB. increasing at the same speed as the battery charge below\nC. increasing at a slower speed than the battery charge below", "gt-answer": "C. increasing at a slower speed than the battery charge below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What can be said about the speed at which the battery charge above is increasing?\nA. at an equal speed as the battery charge below\nB. faster than the battery charge below\nC. slower than the battery charge below", "gt-answer": "C. slower than the battery charge below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the charging speed below, how is the charging speed above?\nA. the same\nB. slower\nC. faster", "gt-answer": "B. slower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1062609286_concat_2": { "speed": [ { "question": "What is happening to the battery charge above?\nA. increasing at a faster speed than the battery charge below\nB. increasing at a slower speed than the battery charge below\nC. increasing at the same speed as the battery charge below", "gt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What can be said about the speed at which the battery charge above is increasing?\nA. slower than the battery charge below\nB. faster than the battery charge below\nC. at an equal speed as the battery charge below", "gt-answer": "B. faster than the battery charge below", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In relation to the charging speed below, how is the charging speed above?\nA. the same\nB. slower\nC. faster", "gt-answer": "C. faster", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1111601171_reverse": { "attribute_change": [ { "question": "What is happening to the sphere building?\nA. It is changing from blue to red.\nB. It is changing from blue to green.\nC. It is changing from green to blue.\nD. It is staying in the same color.", "gt-answer": "B. It is changing from blue to green.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the final color of the sphere building?\nA. Red\nB. Green\nC. Blue\nD. Black", "gt-answer": "B. Green", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How is the sphere building transforming?\nA. It is staying in the same color.\nB. It is changing from green to blue.\nC. It is changing from red to yellow.\nD. It is changing from blue to green.", "gt-answer": "D. It is changing from blue to green.", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086105089_reverse": { "attribute_change": [ { "question": "What is happening to the building?\nA. being constructed\nB. grwoing wider\nC. demolishing", "gt-answer": "C. demolishing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the building changing?\nA. staying the same\nB. getting shorter\nC. growing taller", "gt-answer": "B. getting shorter", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is being done to the building?\nA. constructing\nB. renovating\nC. deconstructing", "gt-answer": "C. deconstructing", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1058498242_reverse": { "attribute_change": [ { "question": "What is happening to the 3d pixels?\nA. changing from a flat surface into a cuboid\nB. changing from a cuboid into a flat surface\nC. changing from a cuboid into the shape of a man\nD. changing from the shape of a man into a cuboid", "gt-answer": "D. changing from the shape of a man into a cuboid", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the 3d pixels transforming?\nA. changing from a sphere into a cuboid\nB. changing from a cuboid into a sphere\nC. changing from the shape of a man into a cuboid\nD. changing from a cuboid into the shape of a man", "gt-answer": "C. changing from the shape of a man into a cuboid", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what shape are the 3d pixels changing into?\nA. a tree\nB. a cuboid\nC. a sphere\nD. a man", "gt-answer": "B. a cuboid", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1082268005_reverse": { "attribute_change": [ { "question": "What is happening to the planet earth?\nA. assembling from toy bricks\nB. disassembling and disappearing\nC. splitting into two halves", "gt-answer": "B. disassembling and disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the planet earth changing?\nA. it is disappearing\nB. it is assembling from toy bricks\nC. it is spinning", "gt-answer": "A. it is disappearing", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "In what way is the planet earth transforming?\nA. it is disassembling and disappearing\nB. it is dissolving into water\nC. it is assembling from toy bricks", "gt-answer": "A. it is disassembling and disappearing", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1070711428_reverse": { "attribute_change": [ { "question": "What is happening to the glacier?\nA. assembling and rising from water\nB. breaking and falling in water\nC. freezing\nD. evaporating", "gt-answer": "A. assembling and rising from water", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What change is happening to the glacier?\nA. falling in water\nB. freezing\nC. rising from water\nD. becoming shorter", "gt-answer": "C. rising from water", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is occurring to the glacier?\nA. evaporating\nB. breaking and falling in water\nC. assembling and rising from water\nD. becoming shorter", "gt-answer": "C. assembling and rising from water", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1057447372_reverse": { "attribute_change": [ { "question": "What is happening to the sport stadium?\nA. turning darker\nB. staying the same brightness\nC. turning brighter", "gt-answer": "A. turning darker", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the sport stadium transforming?\nA. becoming brighter\nB. staying the same brightness\nC. becoming darker", "gt-answer": "C. becoming darker", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the alteration occurring in the sport stadium?\nA. turning brighter\nB. turning darker\nC. remaining the same", "gt-answer": "B. turning darker", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1053334574_reverse": { "attribute_change": [ { "question": "What is happening to the black ink?\nA. staying in the same shape\nB. splitting in half\nC. shrinking into the the center\nD. expanding from the center", "gt-answer": "C. shrinking into the the center", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the black ink transforming?\nA. staying in the same shape\nB. splitting in half\nC. contracting towards the center\nD. expanding from the center", "gt-answer": "C. contracting towards the center", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In what way is the black ink undergoing a change?\nA. drying up\nB. contracting into the center\nC. expanding from the center", "gt-answer": "B. contracting into the center", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1016172301_reverse": { "attribute_change": [ { "question": "What is happening to the 3D house model?\nA. being demolished\nB. being constructed\nC. being painted", "gt-answer": "A. being demolished", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which process is the 3D house model going through?\nA. being constructed\nB. being deconstructed\nC. being repaired", "gt-answer": "B. being deconstructed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What change is occurring to the 3D house model?\nA. being constructed\nB. being dismantled\nC. being renovated", "gt-answer": "B. being dismantled", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1084736389_reverse": { "attribute_change": [ { "question": "What is happening to the face?\nA. Aging\nB. Morphing from a chimpanzee into a human\nC. Morphing from a human into a chimpanzee\nD. Becoming younger", "gt-answer": "C. Morphing from a human into a chimpanzee", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the face transform?\nA. It morphs from a human into a chimpanzee\nB. It gets younger\nC. It morphs from a chimpanzee into a human\nD. It is aging", "gt-answer": "A. It morphs from a human into a chimpanzee", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which animal does the face resemble at the beginning?\nA. Chimpanzee\nB. Giraffe\nC. Human\nD. Tiger", "gt-answer": "C. Human", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1054494542_reverse": { "attribute_change": [ { "question": "What is happening to the background?\nA. changing from pink to green\nB. changing from green to pink\nC. changing from blue to pink\nD. changing from pink to blue", "gt-answer": "C. changing from blue to pink", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the background transforming?\nA. turning blue\nB. turning yellow\nC. truning pink\nD. turning green", "gt-answer": "C. truning pink", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the main change occurring in the background?\nA. changing from pink to blue\nB. changing from pink to green\nC. changing from blue to pink\nD. changing from green to pink", "gt-answer": "C. changing from blue to pink", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055194940_reverse": { "attribute_change": [ { "question": "What is happening to the insect?\nA. transforming from butterfly into pupa\nB. remaining as a butterfly\nC. remaining as a pupa\nD. transforming from pupa into butterfly", "gt-answer": "A. transforming from butterfly into pupa", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the final form of the insect after it undergoes transformation?\nA. pupa\nB. larva\nC. butterfly\nD. egg", "gt-answer": "A. pupa", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What change is occurring in the insect\nA. transforming from pupa into butterfly\nB. transforming from dead to live\nC. transforming from live to dead\nD. transforming from butterfly into pupa", "gt-answer": "D. transforming from butterfly into pupa", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1079384099_reverse": { "attribute_change": [ { "question": "What is happening to the 3d pixel? \nA. It is transforming from the shape of a heart into a triangle\nB. It is transforming from a triangle into the shape of a heart\nC. It is transforming from a white square into the shape of a flower\nD. It is transforming from the shape of a flower into a white square", "gt-answer": "D. It is transforming from the shape of a flower into a white square", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the final shape of the 3d pixel? \nA. A star\nB. A circle\nC. A flower\nD. A square", "gt-answer": "D. A square", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which shapes does the 3d pixel transform through? \nA. From flower to square\nB. From flower to heart\nC. From heart to flower\nD. From square to flower", "gt-answer": "A. From flower to square", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1099811331_reverse": { "attribute_change": [ { "question": "What is happening to the 3d heart?\nA. gradually disappearing\nB. gradually appearing\nC. growing in size\nD. Reducing in size", "gt-answer": "A. gradually disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the 3d heart transforming?\nA. gradually disappearing\nB. Reducing in size\nC. gradually appearing\nD. growing in size", "gt-answer": "A. gradually disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the attribute change of the 3d heart?\nA. gradually disappearing\nB. breaking apart\nC. gradually appearing\nD. splitting in half", "gt-answer": "A. gradually disappearing", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1093340469_reverse": { "attribute_change": [ { "question": "What is happening to the room?\nA. staying the same brightness\nB. turning brighter\nC. turning darker", "gt-answer": "B. turning brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which word best describes the change in the room?\nA. darkening\nB. stabilizing\nC. brightening", "gt-answer": "C. brightening", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the attribute of the room changing?\nA. becoming darker\nB. brightening up\nC. staying unchanged", "gt-answer": "A. becoming darker", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1111601171": { "attribute_change": [ { "question": "What is happening to the sphere building?\nA. It is changing from green to blue.\nB. It is changing from blue to green.\nC. It is changing from blue to red.\nD. It is staying in the same color.", "gt-answer": "A. It is changing from green to blue.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the final color of the sphere building?\nA. Red\nB. Green\nC. Blue\nD. Black", "gt-answer": "C. Blue", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "How is the sphere building transforming?\nA. It is changing from green to blue.\nB. It is staying in the same color.\nC. It is changing from blue to green.\nD. It is changing from red to yellow.", "gt-answer": "A. It is changing from green to blue.", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1086105089": { "attribute_change": [ { "question": "What is happening to the building?\nA. being constructed\nB. demolishing\nC. grwoing wider", "gt-answer": "A. being constructed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the building changing?\nA. growing taller\nB. staying the same\nC. getting shorter", "gt-answer": "A. growing taller", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is being done to the building?\nA. deconstructing\nB. constructing\nC. renovating", "gt-answer": "B. constructing", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1058498242": { "attribute_change": [ { "question": "What is happening to the 3d pixels?\nA. changing from a cuboid into a flat surface\nB. changing from the shape of a man into a cuboid\nC. changing from a cuboid into the shape of a man\nD. changing from a flat surface into a cuboid", "gt-answer": "C. changing from a cuboid into the shape of a man", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the 3d pixels transforming?\nA. changing from a cuboid into the shape of a man\nB. changing from a sphere into a cuboid\nC. changing from a cuboid into a sphere\nD. changing from the shape of a man into a cuboid", "gt-answer": "A. changing from a cuboid into the shape of a man", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what shape are the 3d pixels changing into?\nA. a cuboid\nB. a man\nC. a sphere\nD. a tree", "gt-answer": "B. a man", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1082268005": { "attribute_change": [ { "question": "What is happening to the planet earth?\nA. assembling from toy bricks\nB. disassembling and disappearing\nC. splitting into two halves", "gt-answer": "A. assembling from toy bricks", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the planet earth changing?\nA. it is spinning\nB. it is disappearing\nC. it is assembling from toy bricks", "gt-answer": "C. it is assembling from toy bricks", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In what way is the planet earth transforming?\nA. it is disassembling and disappearing\nB. it is dissolving into water\nC. it is assembling from toy bricks", "gt-answer": "C. it is assembling from toy bricks", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1070711428": { "attribute_change": [ { "question": "What is happening to the glacier?\nA. breaking and falling in water\nB. assembling and rising from water\nC. freezing\nD. evaporating", "gt-answer": "A. breaking and falling in water", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What change is happening to the glacier?\nA. falling in water\nB. rising from water\nC. becoming shorter\nD. freezing", "gt-answer": "A. falling in water", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is occurring to the glacier?\nA. breaking and falling in water\nB. becoming shorter\nC. assembling and rising from water\nD. evaporating", "gt-answer": "A. breaking and falling in water", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1057447372": { "attribute_change": [ { "question": "What is happening to the sport stadium?\nA. turning darker\nB. turning brighter\nC. staying the same brightness", "gt-answer": "B. turning brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the sport stadium transforming?\nA. staying the same brightness\nB. becoming darker\nC. becoming brighter", "gt-answer": "C. becoming brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the alteration occurring in the sport stadium?\nA. remaining the same\nB. turning darker\nC. turning brighter", "gt-answer": "C. turning brighter", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1053334574": { "attribute_change": [ { "question": "What is happening to the black ink?\nA. staying in the same shape\nB. shrinking into the the center\nC. splitting in half\nD. expanding from the center", "gt-answer": "D. expanding from the center", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the black ink transforming?\nA. splitting in half\nB. staying in the same shape\nC. expanding from the center\nD. contracting towards the center", "gt-answer": "C. expanding from the center", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what way is the black ink undergoing a change?\nA. drying up\nB. contracting into the center\nC. expanding from the center", "gt-answer": "C. expanding from the center", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1016172301": { "attribute_change": [ { "question": "What is happening to the 3D house model?\nA. being constructed\nB. being painted\nC. being demolished", "gt-answer": "A. being constructed", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which process is the 3D house model going through?\nA. being deconstructed\nB. being repaired\nC. being constructed", "gt-answer": "C. being constructed", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What change is occurring to the 3D house model?\nA. being renovated\nB. being constructed\nC. being dismantled", "gt-answer": "B. being constructed", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1084736389": { "attribute_change": [ { "question": "What is happening to the face?\nA. Aging\nB. Morphing from a chimpanzee into a human\nC. Becoming younger\nD. Morphing from a human into a chimpanzee", "gt-answer": "B. Morphing from a chimpanzee into a human", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the face transform?\nA. It morphs from a chimpanzee into a human\nB. It is aging\nC. It morphs from a human into a chimpanzee\nD. It gets younger", "gt-answer": "A. It morphs from a chimpanzee into a human", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which animal does the face resemble at the beginning?\nA. Human\nB. Giraffe\nC. Tiger\nD. Chimpanzee", "gt-answer": "D. Chimpanzee", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1054494542": { "attribute_change": [ { "question": "What is happening to the background?\nA. changing from pink to green\nB. changing from pink to blue\nC. changing from green to pink\nD. changing from blue to pink", "gt-answer": "B. changing from pink to blue", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How is the background transforming?\nA. turning green\nB. truning pink\nC. turning yellow\nD. turning blue", "gt-answer": "D. turning blue", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "What is the main change occurring in the background?\nA. changing from green to pink\nB. changing from pink to green\nC. changing from blue to pink\nD. changing from pink to blue", "gt-answer": "D. changing from pink to blue", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055194940": { "attribute_change": [ { "question": "What is happening to the insect?\nA. remaining as a butterfly\nB. transforming from butterfly into pupa\nC. transforming from pupa into butterfly\nD. remaining as a pupa", "gt-answer": "C. transforming from pupa into butterfly", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the final form of the insect after it undergoes transformation?\nA. larva\nB. pupa\nC. butterfly\nD. egg", "gt-answer": "C. butterfly", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What change is occurring in the insect\nA. transforming from butterfly into pupa\nB. transforming from dead to live\nC. transforming from live to dead\nD. transforming from pupa into butterfly", "gt-answer": "D. transforming from pupa into butterfly", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1079384099": { "attribute_change": [ { "question": "What is happening to the 3d pixel? \nA. It is transforming from a white square into the shape of a flower\nB. It is transforming from a triangle into the shape of a heart\nC. It is transforming from the shape of a heart into a triangle\nD. It is transforming from the shape of a flower into a white square", "gt-answer": "A. It is transforming from a white square into the shape of a flower", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the final shape of the 3d pixel? \nA. A flower\nB. A star\nC. A circle\nD. A square", "gt-answer": "A. A flower", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which shapes does the 3d pixel transform through? \nA. From flower to square\nB. From flower to heart\nC. From heart to flower\nD. From square to flower", "gt-answer": "D. From square to flower", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1099811331": { "attribute_change": [ { "question": "What is happening to the 3d heart?\nA. Reducing in size\nB. gradually disappearing\nC. gradually appearing\nD. growing in size", "gt-answer": "C. gradually appearing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the 3d heart transforming?\nA. gradually disappearing\nB. growing in size\nC. gradually appearing\nD. Reducing in size", "gt-answer": "C. gradually appearing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the attribute change of the 3d heart?\nA. gradually appearing\nB. splitting in half\nC. gradually disappearing\nD. breaking apart", "gt-answer": "A. gradually appearing", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1093340469": { "attribute_change": [ { "question": "What is happening to the room?\nA. staying the same brightness\nB. turning brighter\nC. turning darker", "gt-answer": "C. turning darker", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which word best describes the change in the room?\nA. darkening\nB. brightening\nC. stabilizing", "gt-answer": "A. darkening", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How is the attribute of the room changing?\nA. staying unchanged\nB. brightening up\nC. becoming darker", "gt-answer": "C. becoming darker", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_0": { "order": [ { "question": "What is the order of events in the video?\nA. Sun rising and then ice cream melting\nB. Ice cream melting and then sun rising\nC. Sun rising and ice cream melting at the same time", "gt-answer": "C. Sun rising and ice cream melting at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Both events happen simultaneously\nB. Sun rising\nC. Ice cream melting", "gt-answer": "A. Both events happen simultaneously", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video?\nA. Both events occur at the same time\nB. Ice cream melting, sun rising\nC. Sun rising, ice cream melting", "gt-answer": "A. Both events occur at the same time", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_1": { "order": [ { "question": "What is the order of events in the video?\nA. Sun rising and ice cream melting at the same time\nB. Sun rising and then ice cream melting\nC. Ice cream melting and then sun rising", "gt-answer": "C. Ice cream melting and then sun rising", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Sun rising\nB. Ice cream melting\nC. Both events happen simultaneously", "gt-answer": "B. Ice cream melting", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur in the video?\nA. Ice cream melting, sun rising\nB. Sun rising, ice cream melting\nC. Both events occur at the same time", "gt-answer": "A. Ice cream melting, sun rising", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1059072773_1059718130_2": { "order": [ { "question": "What is the order of events in the video?\nA. Sun rising and ice cream melting at the same time\nB. Sun rising and then ice cream melting\nC. Ice cream melting and then sun rising", "gt-answer": "B. Sun rising and then ice cream melting", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Both events happen simultaneously\nB. Sun rising\nC. Ice cream melting", "gt-answer": "B. Sun rising", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video?\nA. Sun rising, ice cream melting\nB. Ice cream melting, sun rising\nC. Both events occur at the same time", "gt-answer": "A. Sun rising, ice cream melting", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1024867412_1034049020_0": { "order": [ { "question": "What is the order of events in the video?\nA. A girl is walking on the street while a dog is simultaneously driving\nB. A girl is walking on the street, then a dog is driving\nC. A dog is driving, then a girl is walking on the street", "gt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A. A girl is walking on the street while a dog is simultaneously driving.", "match_success": true, "rating": 1 }, { "question": "Which event happens first in the video?\nA. A dog is driving\nB. Both events happen concurrently\nC. A girl is walking on the street", "gt-answer": "B. Both events happen concurrently", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video?A. A dog is driving, followed by a girl walking on the street\nA. A girl is walking on the street while a dog is driving at the same time\nB. A girl is walking on the street, followed by a dog driving", "gt-answer": "A. A girl is walking on the street while a dog is driving at the same time", "video-llm-prediction": "A. A dog is driving, followed by a girl walking on the street.", "match_success": true, "rating": 1 } ] }, "1024867412_1034049020_1": { "order": [ { "question": "What is the order of events in the video?\nA. A dog is driving, then a girl is walking on the street\nB. A girl is walking on the street, then a dog is driving\nC. A girl is walking on the street while a dog is simultaneously driving", "gt-answer": "A. A dog is driving, then a girl is walking on the street", "video-llm-prediction": "A. A dog is driving, then a girl is walking on the street.", "match_success": true, "rating": 1 }, { "question": "Which event happens first in the video?\nA. A dog is driving\nB. A girl is walking on the street\nC. Both events happen concurrently", "gt-answer": "A. A dog is driving", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur in the video?\nA. A dog is driving, followed by a girl walking on the street\nB. A girl is walking on the street, followed by a dog driving\nC. A girl is walking on the street while a dog is driving at the same time", "gt-answer": "A. A dog is driving, followed by a girl walking on the street", "video-llm-prediction": "A. A dog is driving, followed by a girl walking on the street.", "match_success": true, "rating": 1 } ] }, "1024867412_1034049020_2": { "order": [ { "question": "What is the order of events in the video?\nA. A girl is walking on the street, then a dog is driving\nB. A girl is walking on the street while a dog is simultaneously driving\nC. A dog is driving, then a girl is walking on the street", "gt-answer": "A. A girl is walking on the street, then a dog is driving", "video-llm-prediction": "A. A girl is walking on the street, then a dog is driving.", "match_success": true, "rating": 1 }, { "question": "Which event happens first in the video?\nA. A girl is walking on the street\nB. A dog is driving\nC. Both events happen concurrently", "gt-answer": "A. A girl is walking on the street", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur in the video?A. A dog is driving, followed by a girl walking on the street\nA. A girl is walking on the street, followed by a dog driving\nB. A girl is walking on the street while a dog is driving at the same time", "gt-answer": "A. A girl is walking on the street, followed by a dog driving", "video-llm-prediction": "A. A dog is driving, followed by a girl walking on the street.", "match_success": true, "rating": 1 } ] }, "1096238125_1098970151_0": { "order": [ { "question": "What is the order of the events in the video?\nA. Two people are lifting weights and then a cat is licking its paw\nB. The events are happening simultaneously, there is no specific order\nC. A cat is licking its paw and then two people are lifting weights", "gt-answer": "B. The events are happening simultaneously, there is no specific order", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. A cat is licking its paw\nB. Two people are lifting weights\nC. Both events happen at the same time", "gt-answer": "C. Both events happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what order do the events take place in the video?\nA. The events happen simultaneously\nB. Two people are lifting weights followed by a cat licking its paw\nC. A cat is licking its paw followed by two people lifting weights", "gt-answer": "A. The events happen simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1096238125_1098970151_1": { "order": [ { "question": "What is the order of the events in the video?\nA. A cat is licking its paw and then two people are lifting weights\nB. Two people are lifting weights and then a cat is licking its paw\nC. The events are happening simultaneously, there is no specific order", "gt-answer": "B. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Two people are lifting weights\nB. Both events happen at the same time\nC. A cat is licking its paw", "gt-answer": "A. Two people are lifting weights", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In what order do the events take place in the video?\nA. Two people are lifting weights followed by a cat licking its paw\nB. The events happen simultaneously\nC. A cat is licking its paw followed by two people lifting weights", "gt-answer": "A. Two people are lifting weights followed by a cat licking its paw", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1096238125_1098970151_2": { "order": [ { "question": "What is the order of the events in the video?\nA. Two people are lifting weights and then a cat is licking its paw\nB. A cat is licking its paw and then two people are lifting weights\nC. The events are happening simultaneously, there is no specific order", "gt-answer": "B. A cat is licking its paw and then two people are lifting weights", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Two people are lifting weights\nB. Both events happen at the same time\nC. A cat is licking its paw", "gt-answer": "C. A cat is licking its paw", "video-llm-prediction": "A. Two people are lifting weights", "match_success": true, "rating": 0 }, { "question": "In what order do the events take place in the video?\nA. The events happen simultaneously\nB. Two people are lifting weights followed by a cat licking its paw\nC. A cat is licking its paw followed by two people lifting weights", "gt-answer": "C. A cat is licking its paw followed by two people lifting weights", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_0": { "order": [ { "question": "What is the order of events in the video?\nA. First, a woman is showing different expressions; then, a man is showing different expressions.\nB. First, a man is showing different expressions; then, a woman is showing different expressions.\nC. Both the woman and the man are showing different expressions at the same time.", "gt-answer": "C. Both the woman and the man are showing different expressions at the same time.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence are the events presented in the video?\nA. The man presents his expressions first, followed by the woman.\nB. The woman presents his expressions first, followed by the man.\nC. The woman and man are showing their expressions simultaneously.", "gt-answer": "C. The woman and man are showing their expressions simultaneously.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs earlier in the video?\nA. The man showing different expressions\nB. They both happen together\nC. The woman showing different expressions", "gt-answer": "B. They both happen together", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_1": { "order": [ { "question": "What is the order of events in the video?\nA. First, a man is showing different expressions; then, a woman is showing different expressions.\nB. First, a woman is showing different expressions; then, a man is showing different expressions.\nC. Both the woman and the man are showing different expressions at the same time.", "gt-answer": "B. First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "A. First, a man is showing different expressions; then, a woman is showing different expressions.", "match_success": true, "rating": 0 }, { "question": "In what sequence are the events presented in the video?\nA. The woman and man are showing their expressions simultaneously.\nB. The man presents his expressions first, followed by the woman.\nC. The woman presents his expressions first, followed by the man.", "gt-answer": "C. The woman presents his expressions first, followed by the man.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs earlier in the video?\nA. The man showing different expressions\nB. The woman showing different expressions\nC. They both happen together", "gt-answer": "B. The woman showing different expressions", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_2": { "order": [ { "question": "What is the order of events in the video?\nA. First, a woman is showing different expressions; then, a man is showing different expressions.\nB. Both the woman and the man are showing different expressions at the same time.\nC. First, a man is showing different expressions; then, a woman is showing different expressions.", "gt-answer": "C. First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence are the events presented in the video?\nA. The man presents his expressions first, followed by the woman.\nB. The woman presents his expressions first, followed by the man.\nC. The woman and man are showing their expressions simultaneously.", "gt-answer": "A. The man presents his expressions first, followed by the woman.", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event occurs earlier in the video?\nA. The woman showing different expressions\nB. They both happen together\nC. The man showing different expressions", "gt-answer": "C. The man showing different expressions", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_0": { "order": [ { "question": "What is the correct order of events in the video?\nA. The fire ball is expanding, then the earth is spinning\nB. The earth is spinning, then the fire ball is expanding\nC. Simultaneously, the earth is spinning and the fire ball is expanding", "gt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the first event of the video?\nA. Both events happen together\nB. The fire ball is expanding\nC. The earth is spinning", "gt-answer": "A. Both events happen together", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is happening in the second event of the video?\nA. The earth is spinning\nB. The fire ball is expanding\nC. Both events happen together", "gt-answer": "C. Both events happen together", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_1": { "order": [ { "question": "What is the correct order of events in the video?\nA. The fire ball is expanding, then the earth is spinning\nB. The earth is spinning, then the fire ball is expanding\nC. Simultaneously, the earth is spinning and the fire ball is expanding", "gt-answer": "B. The earth is spinning, then the fire ball is expanding", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the first event of the video?\nA. The earth is spinning\nB. Both events happen together\nC. The fire ball is expanding", "gt-answer": "A. The earth is spinning", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening in the second event of the video?\nA. Both events happen together\nB. The earth is spinning\nC. The fire ball is expanding", "gt-answer": "C. The fire ball is expanding", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1055413730_1055973887_2": { "order": [ { "question": "What is the correct order of events in the video?\nA. Simultaneously, the earth is spinning and the fire ball is expanding\nB. The fire ball is expanding, then the earth is spinning\nC. The earth is spinning, then the fire ball is expanding", "gt-answer": "B. The fire ball is expanding, then the earth is spinning", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the first event of the video?\nA. The fire ball is expanding\nB. Both events happen together\nC. The earth is spinning", "gt-answer": "A. The fire ball is expanding", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening in the second event of the video?\nA. The fire ball is expanding\nB. The earth is spinning\nC. Both events happen together", "gt-answer": "B. The earth is spinning", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_0": { "order": [ { "question": "What is the order of events in the video?\nA. A person is picking up a pineapple and then a squirrel is foraging\nB. A squirrel is foraging and then a person is picking up a pineapple\nC. Both events are happening concurrently", "gt-answer": "C. Both events are happening concurrently", "video-llm-prediction": "A. A person is picking up a pineapple and then a squirrel is foraging", "match_success": true, "rating": 0 }, { "question": "In what sequence are the events happening in the video?\nA. First, a person is picking up a pineapple; then, a squirrel is foraging\nB. First, a squirrel is foraging; then, a person is picking up a pineapple\nC. Both events are happening simultaneously", "gt-answer": "C. Both events are happening simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the arrangement of the events in the video?\nA. A person picks up a pineapple before a squirrel starts foraging\nB. They happen at exactly the same time\nC. A squirrel is foraging before a person picks up a pineapple", "gt-answer": "B. They happen at exactly the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_1": { "order": [ { "question": "What is the order of events in the video?\nA. Both events are happening concurrently\nB. A squirrel is foraging and then a person is picking up a pineapple\nC. A person is picking up a pineapple and then a squirrel is foraging", "gt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "A. Both events are happening concurrently", "match_success": true, "rating": 0 }, { "question": "In what sequence are the events happening in the video?\nA. First, a squirrel is foraging; then, a person is picking up a pineapple\nB. Both events are happening simultaneously\nC. First, a person is picking up a pineapple; then, a squirrel is foraging", "gt-answer": "A. First, a squirrel is foraging; then, a person is picking up a pineapple", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the arrangement of the events in the video?\nA. A squirrel is foraging before a person picks up a pineapple\nB. A person picks up a pineapple before a squirrel starts foraging\nC. They happen at exactly the same time", "gt-answer": "A. A squirrel is foraging before a person picks up a pineapple", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1058907236_1021488277_2": { "order": [ { "question": "What is the order of events in the video?\nA. Both events are happening concurrently\nB. A person is picking up a pineapple and then a squirrel is foraging\nC. A squirrel is foraging and then a person is picking up a pineapple", "gt-answer": "B. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "In what sequence are the events happening in the video?\nA. Both events are happening simultaneously\nB. First, a squirrel is foraging; then, a person is picking up a pineapple\nC. First, a person is picking up a pineapple; then, a squirrel is foraging", "gt-answer": "C. First, a person is picking up a pineapple; then, a squirrel is foraging", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the arrangement of the events in the video?\nA. A squirrel is foraging before a person picks up a pineapple\nB. They happen at exactly the same time\nC. A person picks up a pineapple before a squirrel starts foraging", "gt-answer": "C. A person picks up a pineapple before a squirrel starts foraging", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1054717541_1047368344_0": { "order": [ { "question": "What is the sequence of events in the video?\nA. a girl jumping into water followed by a person kneading dough\nB. a person is kneading dough followed by a girl jumping into water\nC. a girl jumping into water while a person kneading dough", "gt-answer": "C. a girl jumping into water while a person kneading dough", "video-llm-prediction": "A. a girl jumping into water followed by a person kneading dough", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. a person is kneading dough\nB. a girl is jumping into water\nC. Both events occur at the same time", "gt-answer": "C. Both events occur at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event occurs second in the video?\nA. Both events occur at the same time\nB. a girl is jumping into water\nC. a person is kneading dough", "gt-answer": "A. Both events occur at the same time", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1054717541_1047368344_1": { "order": [ { "question": "What is the sequence of events in the video?\nA. a person is kneading dough followed by a girl jumping into water\nB. a girl jumping into water followed by a person kneading dough\nC. a girl jumping into water while a person kneading dough", "gt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "A. a person is kneading dough followed by a girl jumping into water", "match_success": true, "rating": 1 }, { "question": "What is happening first in the video?\nA. Both events occur at the same time\nB. a person is kneading dough\nC. a girl is jumping into water", "gt-answer": "B. a person is kneading dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What event occurs second in the video?\nA. a person is kneading dough\nB. a girl is jumping into water\nC. Both events occur at the same time", "gt-answer": "B. a girl is jumping into water", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1054717541_1047368344_2": { "order": [ { "question": "What is the sequence of events in the video?\nA. a person is kneading dough followed by a girl jumping into water\nB. a girl jumping into water followed by a person kneading dough\nC. a girl jumping into water while a person kneading dough", "gt-answer": "B. a girl jumping into water followed by a person kneading dough", "video-llm-prediction": "A. a person is kneading dough followed by a girl jumping into water.", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. a girl is jumping into water\nB. a person is kneading dough\nC. Both events occur at the same time", "gt-answer": "A. a girl is jumping into water", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What event occurs second in the video?\nA. a girl is jumping into water\nB. Both events occur at the same time\nC. a person is kneading dough", "gt-answer": "C. a person is kneading dough", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1089201973_1086820415_0": { "order": [ { "question": "What is the order of events in the video?\nA. A person is kicking football and then a big wave is shown\nB. The events are shown simultaneously\nC. A big wave is shown and then a person is kicking football", "gt-answer": "B. The events are shown simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event is shown first in the video?\nA. A big wave is shown\nB. Both events happen simultaneously\nC. A person is kicking football", "gt-answer": "B. Both events happen simultaneously", "video-llm-prediction": "A. A big wave is shown", "match_success": true, "rating": 0 }, { "question": "Which event is shown second in the video?\nA. Both events happen simultaneously\nB. A big wave is shown\nC. A person is kicking football", "gt-answer": "A. Both events happen simultaneously", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1089201973_1086820415_1": { "order": [ { "question": "What is the order of events in the video?\nA. The events are shown simultaneously\nB. A big wave is shown and then a person is kicking football\nC. A person is kicking football and then a big wave is shown", "gt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event is shown first in the video?\nA. Both events happen simultaneously\nB. A big wave is shown\nC. A person is kicking football", "gt-answer": "C. A person is kicking football", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which event is shown second in the video?\nA. A person is kicking football\nB. Both events happen simultaneously\nC. A big wave is shown", "gt-answer": "C. A big wave is shown", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1089201973_1086820415_2": { "order": [ { "question": "What is the order of events in the video?\nA. A big wave is shown and then a person is kicking football\nB. The events are shown simultaneously\nC. A person is kicking football and then a big wave is shown", "gt-answer": "A. A big wave is shown and then a person is kicking football", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What event is shown first in the video?\nA. A big wave is shown\nB. A person is kicking football\nC. Both events happen simultaneously", "gt-answer": "A. A big wave is shown", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event is shown second in the video?\nA. A person is kicking football\nB. Both events happen simultaneously\nC. A big wave is shown", "gt-answer": "A. A person is kicking football", "video-llm-prediction": "A. A person is kicking football", "match_success": true, "rating": 1 } ] }, "1080990179_1086820415_0": { "order": [ { "question": "What is the order of events in the video?\nA. At the same time, an apple is drying out and a big wave is shown\nB. A big wave is shown and then an apple is drying out\nC. An apple is drying out and then a big wave is shown", "gt-answer": "A. At the same time, an apple is drying out and a big wave is shown", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event occurs first in the video?\nA. A big wave is shown\nB. Both events occur simultaneously\nC. An apple is drying out", "gt-answer": "B. Both events occur simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs later in the video?\nA. Both events occur simultaneously\nB. An apple is drying out\nC. A big wave is shown", "gt-answer": "A. Both events occur simultaneously", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1080990179_1086820415_1": { "order": [ { "question": "What is the order of events in the video?\nA. An apple is drying out and then a big wave is shown\nB. A big wave is shown and then an apple is drying out\nC. At the same time, an apple is drying out and a big wave is shown", "gt-answer": "A. An apple is drying out and then a big wave is shown", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event occurs first in the video?\nA. Both events occur simultaneously\nB. An apple is drying out\nC. A big wave is shown", "gt-answer": "B. An apple is drying out", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which event occurs later in the video?\nA. An apple is drying out\nB. A big wave is shown\nC. Both events occur simultaneously", "gt-answer": "B. A big wave is shown", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1080990179_1086820415_2": { "order": [ { "question": "What is the order of events in the video?\nA. At the same time, an apple is drying out and a big wave is shown\nB. A big wave is shown and then an apple is drying out\nC. An apple is drying out and then a big wave is shown", "gt-answer": "B. A big wave is shown and then an apple is drying out", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs first in the video?\nA. An apple is drying out\nB. Both events occur simultaneously\nC. A big wave is shown", "gt-answer": "C. A big wave is shown", "video-llm-prediction": "A. An apple is drying out", "match_success": true, "rating": 0 }, { "question": "Which event occurs later in the video?\nA. An apple is drying out\nB. Both events occur simultaneously\nC. A big wave is shown", "gt-answer": "A. An apple is drying out", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1067268403_1064645467_0": { "order": [ { "question": "What is the order of events in the video?\nA. Wind turbines are rotating followed by a man doing exercise\nB. A man doing exercise followed by wind turbines rotating\nC. A man doing exercise and wind turbines rotating concurrently", "gt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the first event of the video?\nA. A man is doing exercise while wind turbines are rotating\nB. Wind turbines are rotating\nC. A man is doing exercise", "gt-answer": "A. A man is doing exercise while wind turbines are rotating", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening in the second event of the video?\nA. Wind turbines are rotating\nB. A man is doing exercise while wind turbines are rotating\nC. A man is doing exercise", "gt-answer": "B. A man is doing exercise while wind turbines are rotating", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1067268403_1064645467_1": { "order": [ { "question": "What is the order of events in the video?\nA. A man doing exercise and wind turbines rotating concurrently\nB. A man doing exercise followed by wind turbines rotating\nC. Wind turbines are rotating followed by a man doing exercise", "gt-answer": "C. Wind turbines are rotating followed by a man doing exercise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the first event of the video?\nA. Wind turbines are rotating\nB. A man is doing exercise while wind turbines are rotating\nC. A man is doing exercise", "gt-answer": "A. Wind turbines are rotating", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening in the second event of the video?\nA. Wind turbines are rotating\nB. A man is doing exercise while wind turbines are rotating\nC. A man is doing exercise", "gt-answer": "C. A man is doing exercise", "video-llm-prediction": "A. Wind turbines are rotating", "match_success": true, "rating": 0 } ] }, "1067268403_1064645467_2": { "order": [ { "question": "What is the order of events in the video?\nA. A man doing exercise and wind turbines rotating concurrently\nB. A man doing exercise followed by wind turbines rotating\nC. Wind turbines are rotating followed by a man doing exercise", "gt-answer": "B. A man doing exercise followed by wind turbines rotating", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the first event of the video?\nA. A man is doing exercise while wind turbines are rotating\nB. A man is doing exercise\nC. Wind turbines are rotating", "gt-answer": "B. A man is doing exercise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening in the second event of the video?\nA. A man is doing exercise while wind turbines are rotating\nB. Wind turbines are rotating\nC. A man is doing exercise", "gt-answer": "B. Wind turbines are rotating", "video-llm-prediction": "A. A man is doing exercise while wind turbines are rotating", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_0": { "order": [ { "question": "What is the order of events in the video?\nA. The events are happening simultaneously\nB. planet earth is assembling from toy bricks and then viruses are dissolving\nC. viruses are dissolving and then planet earth is assembling from toy bricks", "gt-answer": "A. The events are happening simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the first event in the video?\nA. planet earth is assembling from toy bricks\nB. viruses are dissolving\nC. The events are happening simultaneously", "gt-answer": "C. The events are happening simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs last in the video?\nA. The events are happening simultaneously\nB. planet earth is assembling from toy bricks\nC. viruses are dissolving", "gt-answer": "A. The events are happening simultaneously", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_1": { "order": [ { "question": "What is the order of events in the video?\nA. planet earth is assembling from toy bricks and then viruses are dissolving\nB. viruses are dissolving and then planet earth is assembling from toy bricks\nC. The events are happening simultaneously", "gt-answer": "A. planet earth is assembling from toy bricks and then viruses are dissolving", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the first event in the video?\nA. planet earth is assembling from toy bricks\nB. viruses are dissolving\nC. The events are happening simultaneously", "gt-answer": "A. planet earth is assembling from toy bricks", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event occurs last in the video?\nA. The events are happening simultaneously\nB. planet earth is assembling from toy bricks\nC. viruses are dissolving", "gt-answer": "C. viruses are dissolving", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_2": { "order": [ { "question": "What is the order of events in the video?\nA. viruses are dissolving and then planet earth is assembling from toy bricks\nB. The events are happening simultaneously\nC. planet earth is assembling from toy bricks and then viruses are dissolving", "gt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the first event in the video?\nA. planet earth is assembling from toy bricks\nB. The events are happening simultaneously\nC. viruses are dissolving", "gt-answer": "C. viruses are dissolving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs last in the video?\nA. planet earth is assembling from toy bricks\nB. viruses are dissolving\nC. The events are happening simultaneously", "gt-answer": "A. planet earth is assembling from toy bricks", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1060403198_1049965795_0": { "order": [ { "question": "What is the order of events in the video?\nA. A light bulb is lighting up and then the tree is growing up\nB. The tree is growing up and then a light bulb is lighting up\nC. Both events happen at the same time", "gt-answer": "C. Both events happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur?\nA. A light bulb is lighting up and then the tree is growing up\nB. The tree is growing up and then a light bulb is lighting up\nC. Both events happen at the same time", "gt-answer": "C. Both events happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the events ordered in the video?\nA. A light bulb is lighting up and then the tree is growing up\nB. Both events happen at the same time\nC. The tree is growing up and then a light bulb is lighting up", "gt-answer": "B. Both events happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_1": { "order": [ { "question": "What is the order of events in the video?\nA. The tree is growing up and then a light bulb is lighting up\nB. Both events happen at the same time\nC. A light bulb is lighting up and then the tree is growing up", "gt-answer": "A. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur?\nA. Both events happen at the same time\nB. The tree is growing up and then a light bulb is lighting up\nC. A light bulb is lighting up and then the tree is growing up", "gt-answer": "B. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the events ordered in the video?\nA. A light bulb is lighting up and then the tree is growing up\nB. Both events happen at the same time\nC. The tree is growing up and then a light bulb is lighting up", "gt-answer": "C. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_2": { "order": [ { "question": "What is the order of events in the video?\nA. A light bulb is lighting up and then the tree is growing up\nB. The tree is growing up and then a light bulb is lighting up\nC. Both events happen at the same time", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur?\nA. A light bulb is lighting up and then the tree is growing up\nB. The tree is growing up and then a light bulb is lighting up\nC. Both events happen at the same time", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "How are the events ordered in the video?\nA. A light bulb is lighting up and then the tree is growing up\nB. The tree is growing up and then a light bulb is lighting up\nC. Both events happen at the same time", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1091143117_1094219575_0": { "order": [ { "question": "What is the order of events in the video?\nA. An eye is opening first, then a flower is wilting\nB. A flower is wilting first, then an eye is opening\nC. Both events happen simultaneously", "gt-answer": "C. Both events happen simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. A flower is wilting\nB. Both events happen at the same time\nC. An eye is opening", "gt-answer": "B. Both events happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what order do the events occur in the video?\nA. Both events happen at the same time\nB. A flower is wilting followed by an eye is opening\nC. An eye is opening followed by a flower is wilting", "gt-answer": "A. Both events happen at the same time", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1091143117_1094219575_1": { "order": [ { "question": "What is the order of events in the video?\nA. An eye is opening first, then a flower is wilting\nB. Both events happen simultaneously\nC. A flower is wilting first, then an eye is opening", "gt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event happens first in the video?\nA. A flower is wilting\nB. An eye is opening\nC. Both events happen at the same time", "gt-answer": "B. An eye is opening", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what order do the events occur in the video?\nA. An eye is opening followed by a flower is wilting\nB. Both events happen at the same time\nC. A flower is wilting followed by an eye is opening", "gt-answer": "A. An eye is opening followed by a flower is wilting", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1091143117_1094219575_2": { "order": [ { "question": "What is the order of events in the video?\nA. An eye is opening first, then a flower is wilting\nB. Both events happen simultaneously\nC. A flower is wilting first, then an eye is opening", "gt-answer": "C. A flower is wilting first, then an eye is opening", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. A flower is wilting\nB. An eye is opening\nC. Both events happen at the same time", "gt-answer": "A. A flower is wilting", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what order do the events occur in the video?\nA. A flower is wilting followed by an eye is opening\nB. An eye is opening followed by a flower is wilting\nC. Both events happen at the same time", "gt-answer": "A. A flower is wilting followed by an eye is opening", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1086105089_1085910917_0": { "order": [ { "question": "What order do the events occur in?\nA. First, a building is being constructed; then, a woman is drinking water.\nB. First, a woman is drinking water; then, a building is being constructed.\nC. Both events happen simultaneously.", "gt-answer": "C. Both events happen simultaneously.", "video-llm-prediction": "A. First, a building is being constructed; then, a woman is drinking water.", "match_success": true, "rating": 0 }, { "question": "Which event happens before the other?\nA. A building is being constructed happens before a woman is drinking water.\nB. Both events happen at the same time.\nC. A woman is drinking water happens before a building is being constructed.", "gt-answer": "B. Both events happen at the same time.", "video-llm-prediction": "A. A building is being constructed happens before a woman is drinking water.", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur?\nA. A building is being constructed comes first, followed by a woman drinking water.\nB. A woman is drinking water comes first, followed by a building being constructed.\nC. The events happen simultaneously.", "gt-answer": "C. The events happen simultaneously.", "video-llm-prediction": "A.", "match_success": true, "rating": 0 } ] }, "1086105089_1085910917_1": { "order": [ { "question": "What order do the events occur in?\nA. First, a building is being constructed; then, a woman is drinking water.\nB. Both events happen simultaneously.\nC. First, a woman is drinking water; then, a building is being constructed.", "gt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "A. First, a building is being constructed; then, a woman is drinking water.", "match_success": true, "rating": 1 }, { "question": "Which event happens before the other?\nA. A building is being constructed happens before a woman is drinking water.\nB. A woman is drinking water happens before a building is being constructed.\nC. Both events happen at the same time.", "gt-answer": "A. A building is being constructed happens before a woman is drinking water.", "video-llm-prediction": "A. A building is being constructed happens before a woman is drinking water.", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur?\nA. A woman is drinking water comes first, followed by a building being constructed.\nB. A building is being constructed comes first, followed by a woman drinking water.\nC. The events happen simultaneously.", "gt-answer": "B. A building is being constructed comes first, followed by a woman drinking water.", "video-llm-prediction": "A.", "match_success": true, "rating": 0 } ] }, "1086105089_1085910917_2": { "order": [ { "question": "What order do the events occur in?\nA. First, a building is being constructed; then, a woman is drinking water.\nB. First, a woman is drinking water; then, a building is being constructed.\nC. Both events happen simultaneously.", "gt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "A. First, a building is being constructed; then, a woman is drinking water.", "match_success": true, "rating": 0 }, { "question": "Which event happens before the other?\nA. Both events happen at the same time.\nB. A woman is drinking water happens before a building is being constructed.\nC. A building is being constructed happens before a woman is drinking water.", "gt-answer": "B. A woman is drinking water happens before a building is being constructed.", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur?\nA. A building is being constructed comes first, followed by a woman drinking water.\nB. A woman is drinking water comes first, followed by a building being constructed.\nC. The events happen simultaneously.", "gt-answer": "B. A woman is drinking water comes first, followed by a building being constructed.", "video-llm-prediction": "A. A building is being constructed comes first, followed by a woman drinking water.", "match_success": true, "rating": 0 } ] }, "1034736653_1043054206_0": { "order": [ { "question": "In what order do the events occur in the video?\nA. Women running, then cars racing\nB. They happen simultaneously\nC. Cars racing, then women running", "gt-answer": "B. They happen simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. They happen simultaneously\nB. Cars are racing\nC. Women are running", "gt-answer": "A. They happen simultaneously", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which event happens last in the video?\nA. Cars are racing\nB. Women are running\nC. They happen at the same time", "gt-answer": "C. They happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1034736653_1043054206_1": { "order": [ { "question": "In what order do the events occur in the video?\nA. Cars racing, then women running\nB. Women running, then cars racing\nC. They happen simultaneously", "gt-answer": "B. Women running, then cars racing", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. They happen simultaneously\nB. Cars are racing\nC. Women are running", "gt-answer": "C. Women are running", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which event happens last in the video?\nA. Cars are racing\nB. Women are running\nC. They happen at the same time", "gt-answer": "A. Cars are racing", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1034736653_1043054206_2": { "order": [ { "question": "In what order do the events occur in the video?\nA. They happen simultaneously\nB. Women running, then cars racing\nC. Cars racing, then women running", "gt-answer": "C. Cars racing, then women running", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. They happen simultaneously\nB. Cars are racing\nC. Women are running", "gt-answer": "B. Cars are racing", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which event happens last in the video?\nA. Cars are racing\nB. They happen at the same time\nC. Women are running", "gt-answer": "C. Women are running", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_0": { "order": [ { "question": "What is the correct chronological order of the events in the video?\nA. A dog is giving a high five to a woman, and then foods are added into a bowl\nB. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman\nC. Foods are added into a bowl, and then a dog is giving a high five to a woman", "gt-answer": "B. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman", "video-llm-prediction": "A. A dog is giving a high five to a woman, and then foods are added into a bowl.", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Foods are added into a bowl\nB. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman\nC. A dog is giving a high five to a woman", "gt-answer": "B. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman", "video-llm-prediction": "A. Foods are added into a bowl", "match_success": true, "rating": 0 }, { "question": "Which event happens second in the video?\nA. A dog is giving a high five to a woman\nB. Foods are added into a bowl\nC. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman", "gt-answer": "C. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_1": { "order": [ { "question": "What is the correct chronological order of the events in the video?\nA. A dog is giving a high five to a woman, and then foods are added into a bowl\nB. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman\nC. Foods are added into a bowl, and then a dog is giving a high five to a woman", "gt-answer": "C. Foods are added into a bowl, and then a dog is giving a high five to a woman", "video-llm-prediction": "A. A dog is giving a high five to a woman, and then foods are added into a bowl.", "match_success": true, "rating": 0 }, { "question": "Which event happens first in the video?\nA. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman\nB. A dog is giving a high five to a woman\nC. Foods are added into a bowl", "gt-answer": "C. Foods are added into a bowl", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which event happens second in the video?\nA. Foods are added into a bowl\nB. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman\nC. A dog is giving a high five to a woman", "gt-answer": "C. A dog is giving a high five to a woman", "video-llm-prediction": "A. Foods are added into a bowl", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_2": { "order": [ { "question": "What is the correct chronological order of the events in the video?\nA. A dog is giving a high five to a woman, and then foods are added into a bowl\nB. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman\nC. Foods are added into a bowl, and then a dog is giving a high five to a woman", "gt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event happens first in the video?\nA. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman\nB. A dog is giving a high five to a woman\nC. Foods are added into a bowl", "gt-answer": "B. A dog is giving a high five to a woman", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "Which event happens second in the video?\nA. A dog is giving a high five to a woman\nB. Foods are added into a bowl\nC. Simultaneously, foods are added into a bowl and a dog is giving a high five to a woman", "gt-answer": "B. Foods are added into a bowl", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1053758117_1055413730_0": { "order": [ { "question": "What is the order of events in the video?\nA. The digital brain is spinning and then the earth is spinning.\nB. Both events occur at the same time\nC. The earth is spinning and then the digital brain is spinning.", "gt-answer": "B. Both events occur at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. The digital brain is spinning.\nB. The events are happening simultaneously\nC. The earth is spinning.", "gt-answer": "B. The events are happening simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs later in the video?\nA. The digital brain is spinning.\nB. The events are happening simultaneously\nC. The earth is spinning.", "gt-answer": "B. The events are happening simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1053758117_1055413730_1": { "order": [ { "question": "What is the order of events in the video?\nA. The earth is spinning and then the digital brain is spinning.\nB. Both events occur at the same time\nC. The digital brain is spinning and then the earth is spinning.", "gt-answer": "C. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. The events are happening simultaneously\nB. The earth is spinning.\nC. The digital brain is spinning.", "gt-answer": "C. The digital brain is spinning.", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which event occurs later in the video?\nA. The events are happening simultaneously\nB. The earth is spinning.\nC. The digital brain is spinning.", "gt-answer": "B. The earth is spinning.", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1053758117_1055413730_2": { "order": [ { "question": "What is the order of events in the video?\nA. Both events occur at the same time\nB. The digital brain is spinning and then the earth is spinning.\nC. The earth is spinning and then the digital brain is spinning.", "gt-answer": "C. The earth is spinning and then the digital brain is spinning.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. The digital brain is spinning.\nB. The earth is spinning.\nC. The events are happening simultaneously", "gt-answer": "B. The earth is spinning.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event occurs later in the video?\nA. The events are happening simultaneously\nB. The earth is spinning.\nC. The digital brain is spinning.", "gt-answer": "C. The digital brain is spinning.", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1076877854_1073914229_0": { "order": [ { "question": "In what order do the events occur in the video?\nA. trains are driving, then robotic arms are working\nB. they happen at the same time\nC. robotic arms are working, then trains are driving", "gt-answer": "B. they happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event happens first in the video?\nA. they happen at the same time\nB. trains are driving\nC. robotic arms are working", "gt-answer": "A. they happen at the same time", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What event happens last in the video?\nA. trains are driving\nB. they happen at the same time\nC. robotic arms are working", "gt-answer": "B. they happen at the same time", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1076877854_1073914229_1": { "order": [ { "question": "In what order do the events occur in the video?\nA. trains are driving, then robotic arms are working\nB. they happen at the same time\nC. robotic arms are working, then trains are driving", "gt-answer": "C. robotic arms are working, then trains are driving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event happens first in the video?\nA. robotic arms are working\nB. they happen at the same time\nC. trains are driving", "gt-answer": "A. robotic arms are working", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What event happens last in the video?\nA. they happen at the same time\nB. trains are driving\nC. robotic arms are working", "gt-answer": "B. trains are driving", "video-llm-prediction": "C", "match_success": true, "rating": 0 } ] }, "1076877854_1073914229_2": { "order": [ { "question": "In what order do the events occur in the video?\nA. robotic arms are working, then trains are driving\nB. trains are driving, then robotic arms are working\nC. they happen at the same time", "gt-answer": "B. trains are driving, then robotic arms are working", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event happens first in the video?\nA. robotic arms are working\nB. trains are driving\nC. they happen at the same time", "gt-answer": "B. trains are driving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What event happens last in the video?\nA. robotic arms are working\nB. they happen at the same time\nC. trains are driving", "gt-answer": "A. robotic arms are working", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1067268406_1067427023_0": { "order": [ { "question": "What is the order of events in the video?\nA. snow particles are melting, then a white car is driving\nB. a white car is driving while snow particles are melting simultaneously\nC. a white car is driving, then snow particles are melting", "gt-answer": "B. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. a white car is driving\nB. a white car is driving while snow particles are melting simultaneously\nC. snow particles are melting", "gt-answer": "B. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening second in the video?\nA. a white car is driving while snow particles are melting simultaneously\nB. a white car is driving\nC. snow particles are melting", "gt-answer": "A. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1067268406_1067427023_1": { "order": [ { "question": "What is the order of events in the video?\nA. a white car is driving, then snow particles are melting\nB. snow particles are melting, then a white car is driving\nC. a white car is driving while snow particles are melting simultaneously", "gt-answer": "A. a white car is driving, then snow particles are melting", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening first in the video?\nA. snow particles are melting\nB. a white car is driving while snow particles are melting simultaneously\nC. a white car is driving", "gt-answer": "C. a white car is driving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening second in the video?\nA. a white car is driving\nB. a white car is driving while snow particles are melting simultaneously\nC. snow particles are melting", "gt-answer": "C. snow particles are melting", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1067268406_1067427023_2": { "order": [ { "question": "What is the order of events in the video?\nA. a white car is driving while snow particles are melting simultaneously\nB. snow particles are melting, then a white car is driving\nC. a white car is driving, then snow particles are melting", "gt-answer": "B. snow particles are melting, then a white car is driving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening first in the video?\nA. a white car is driving while snow particles are melting simultaneously\nB. snow particles are melting\nC. a white car is driving", "gt-answer": "B. snow particles are melting", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is happening second in the video?\nA. a white car is driving\nB. snow particles are melting\nC. a white car is driving while snow particles are melting simultaneously", "gt-answer": "A. a white car is driving", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1086286649": { "action": [ { "question": "What are the armored vehicles doing in the video?\nA. Loading People\nB. Parked\nC. Driving\nD. Firing", "gt-answer": "C. Driving", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the armored vehicles moving?\nA. Driving\nB. Bouncing\nC. Standing still\nD. Hovering", "gt-answer": "A. Driving", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the main action performed by the armored vehicles?\nA. Firing\nB. Loading People\nC. Driving\nD. Under Repair", "gt-answer": "C. Driving", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Which way are the armored vehicles moving from the camera's point of view?\nA. Stationary\nB. Right to left\nC. Left to right", "gt-answer": "B. Right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Towards which direction are the armored vehicles approaching?\nA. The right side of screen\nB. The upper side of screen\nC. The lower side of screen\nD. The left side of screen", "gt-answer": "D. The left side of screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How are the armored vehicles proceeding?\nA. From bottom to top\nB. From top to bottom\nC. From left to right\nD. From right to left", "gt-answer": "D. From right to left", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ], "speed": [ { "question": "How are the armored vehicles moving?\nA. Stationary\nB. Rapidly\nC. Slowly", "gt-answer": "C. Slowly", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the pace of the armored vehicles?\nA. Fast\nB. Slow\nC. Stationary", "gt-answer": "B. Slow", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "In terms of speed, how would you describe the movement of the armored vehicles?\nA. Slowly\nB. Stationary\nC. Quickly", "gt-answer": "A. Slowly", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1093041749": { "action": [ { "question": "What is the dragon doing in the video?\nA. flying\nB. swimming\nC. breathing fire", "gt-answer": "C. breathing fire", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action can the dragon perform?\nA. breathing fire\nB. eating food\nC. laying eggs", "gt-answer": "A. breathing fire", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity does the dragon engage in?\nA. eating food\nB. breathing fire\nC. laying eggs", "gt-answer": "B. breathing fire", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events performed by the dragon?\nA. flying to the sky and then breathing fire\nB. landing from the sky and then breathing fire\nC. breathing fire and then flying to the sky\nD. breathing fire and then landing from the sky", "gt-answer": "B. landing from the sky and then breathing fire", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the first action that the dragon performs?\nA. landing from the sky\nB. breathing fire\nC. eating food\nD. laying eggs", "gt-answer": "A. landing from the sky", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the second event that the dragon performs?\nA. breathing fire\nB. eating food\nC. landing from the sky\nD. laying eggs", "gt-answer": "A. breathing fire", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1076180768": { "action": [ { "question": "What is the knight doing in the video?\nA. riding a horse\nB. wielding a spear\nC. drawing sword from sheath\nD. shooting an arrow", "gt-answer": "C. drawing sword from sheath", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the knight performing?\nA. drawing sword from sheath\nB. shooting an arrow\nC. raising a shield\nD. putting on armor", "gt-answer": "A. drawing sword from sheath", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the knight demonstrating?\nA. putting on armor\nB. casting a spell\nC. drawing sword from sheath\nD. shooting a bow and arrow", "gt-answer": "C. drawing sword from sheath", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "3406661033": { "action": [ { "question": "What is the man doing in the video?\nA. propelling himself forward in wheelchair\nB. swimming\nC. walking", "gt-answer": "A. propelling himself forward in wheelchair", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which action is the man performing?\nA. running\nB. propelling himself forward in wheelchair\nC. jumping", "gt-answer": "B. propelling himself forward in wheelchair", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "How is the man moving?\nA. running\nB. propelling himself forward in wheelchair\nC. crawling", "gt-answer": "B. propelling himself forward in wheelchair", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events in the video?\nA. The man hands the document to colleagues and then stands up from the wheelchair\nB. The man propels himself forward in wheelchair and then hands the document to colleagues.\nC. The man hands the document to colleagues and then propels himself forward in wheelchair.\nD. The man stands up from the wheelchair and then hands the document to colleagues", "gt-answer": "B. The man propels himself forward in wheelchair and then hands the document to colleagues.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which order did the man perform the actions?\nA. He stands up from the wheelchair and then hands the document to colleagues\nB. He propelled himself forward in wheelchair and then handed the document to colleagues.\nC. He hands the document to colleagues and then stands up from the wheelchair\nD. He handed the document to colleagues and then propelled himself forward in wheelchair.", "gt-answer": "B. He propelled himself forward in wheelchair and then handed the document to colleagues.", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action did the man perform first?\nA. Standing up from wheelchair\nB. Sitting down onto wheelchair\nC. Propelling himself forward in wheelchair\nD. Handing the document to colleagues", "gt-answer": "C. Propelling himself forward in wheelchair", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "3406618583": { "action": [ { "question": "What type of dance is the woman performing?\nA. hip-hop\nB. salsa\nC. ballet\nD. freestyle dance", "gt-answer": "D. freestyle dance", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which activity is the woman engaged in?\nA. ballet\nB. freestyle dance\nC. hip-hop\nD. jazz dance", "gt-answer": "B. freestyle dance", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the woman demonstrating?\nA. freestyle dance\nB. hip-hop\nC. jazz dance\nD. ballet", "gt-answer": "A. freestyle dance", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What is the direction of the camera movement in the video?\nA. panning left and right around the girl\nB. panning up and down around the girl\nC. rotating clockwise around the girl\nD. zooming in and out around the girl", "gt-answer": "B. panning up and down around the girl", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How is the camera moving in the video?\nA. panning up and down around the girl\nB. rotating counterclockwise around the girl\nC. staying still\nD. panning left and right around the girl", "gt-answer": "A. panning up and down around the girl", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which way is the camera moving around the girl in the video?\nA. panning left and right\nB. zooming in and out\nC. rotating clockwise\nD. panning up and down", "gt-answer": "D. panning up and down", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3405120819": { "action": [ { "question": "What is the chef doing?\nA. cutting dough\nB. shaping dough\nC. placing dough in a dish", "gt-answer": "B. shaping dough", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is the chef performing?\nA. shaping dough\nB. mixing dough with water\nC. cutting dough", "gt-answer": "A. shaping dough", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which activity is the chef engaging in?\nA. shaping dough\nB. baking dough\nC. cutting dough", "gt-answer": "A. shaping dough", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "In what order does the chef perform the actions?\nA. cutting dough and then shaping dough\nB. smiling at the camera and then shaping dough\nC. shaping dough and then smiling at the camera\nD. shaping dough and then cutting dough", "gt-answer": "C. shaping dough and then smiling at the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the chef doing first in the video?\nA. shaping dough\nB. tossing the dough in the air\nC. smiling at the camera\nD. cutting dough", "gt-answer": "A. shaping dough", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening in the second part of the video?\nA. the chef is smiling at the camera\nB. the chef is shaping dough\nC. the chef is tossing the dough in the air\nD. the chef is cutting dough", "gt-answer": "A. the chef is smiling at the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "3405088753": { "action": [ { "question": "What is the woman doing in the video?\nA. cooking soup\nB. eating apple\nC. buying bread\nD. sleeping", "gt-answer": "C. buying bread", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the woman performing in the video?\nA. reading a book\nB. dancing\nC. buying bread\nD. working out", "gt-answer": "C. buying bread", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in?\nA. buying bread\nB. swimming\nC. painting\nD. gardening", "gt-answer": "A. buying bread", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "In what order do the events occur involving the salesman?\nA. They happen at the same time\nB. packing up the bread for the woman and then saying something to the woman\nC. saying something to the woman and then packing up the bread for the woman", "gt-answer": "B. packing up the bread for the woman and then saying something to the woman", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What is the first event in the video involving the salesman?\nA. packing up the bread for the woman\nB. saying something to the woman\nC. baking bread", "gt-answer": "A. packing up the bread for the woman", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the last event in the video involving the salesman?\nA. baking bread\nB. packing up the bread for the woman\nC. saying something to the woman", "gt-answer": "C. saying something to the woman", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "3401191309": { "action": [ { "question": "What is the athletic man doing in the video?\nA. putting on prosthetic running blade\nB. taking off prosthetic running blade\nC. repairing a prosthetic running blade", "gt-answer": "B. taking off prosthetic running blade", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which activity is the athletic man engaged in?\nA. taking off prosthetic running blade\nB. putting on prosthetic running blade\nC. repairing a prosthetic running blade", "gt-answer": "A. taking off prosthetic running blade", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is the athletic man performing?\nA. taking off prosthetic running blade\nB. repairing a prosthetic running blade\nC. putting on prosthetic running blade", "gt-answer": "A. taking off prosthetic running blade", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "21218935": { "action": [ { "question": "What is the woman doing?\nA. exercising\nB. cooking\nC. sleeping", "gt-answer": "A. exercising", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which activity is the woman engaged in?\nA. reading\nB. dancing\nC. exercising", "gt-answer": "C. exercising", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In the video, what action is the woman performing?\nA. exercising\nB. walking\nC. painting", "gt-answer": "A. exercising", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ], "order": [ { "question": "What is the order of events for the woman?\nA. doing push ups and then smiling at the camera\nB. doing push ups and then frowning at the camera\nC. smiling at the camera and then doing push ups\nD. crying at the camera and then doing push ups", "gt-answer": "A. doing push ups and then smiling at the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In which order does the woman perform the actions?\nA. doing push ups and then smiling at the camera\nB. doing push ups and then frowning at the camera\nC. crying at the camera and then doing push ups\nD. smiling at the camera and then doing push ups", "gt-answer": "A. doing push ups and then smiling at the camera", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the arrangement of events for the woman?\nA. crying at the camera and then doing push ups\nB. doing push ups and then frowning at the camera\nC. doing push ups and then smiling at the camera\nD. smiling at the camera and then doing push ups", "gt-answer": "C. doing push ups and then smiling at the camera", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "5395244": { "action": [ { "question": "What is the woman doing near the creek?\nA. canoeing across the pebble creek\nB. swimming across the pebble creek\nC. running across the pebble creek\nD. walking across the pebble creek", "gt-answer": "D. walking across the pebble creek", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "How is the woman interacting with the creek?\nA. swimming across it\nB. canoeing across it\nC. walking across it\nD. jumping over it", "gt-answer": "C. walking across it", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in at the moment?\nA. walking across the pebble creek\nB. canoeing across the pebble creek\nC. running across the pebble creek\nD. swimming across the pebble creek", "gt-answer": "A. walking across the pebble creek", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1037628617": { "action": [ { "question": "What is the person doing?\nA. Pressing a keyboard key and rotating a jog dial\nB. clicking button and rolling wheel on a mouse\nC. Tapping a touchpad and scrolling with two fingers", "gt-answer": "B. clicking button and rolling wheel on a mouse", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the person's action in the video?\nA. Tapping a touchpad and scrolling with two fingers\nB. Pressing a keyboard key and rotating a jog dial\nC. clicking button and rolling wheel on a mouse", "gt-answer": "C. clicking button and rolling wheel on a mouse", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what is the person engaged in?\nA. Pressing a keyboard key and rotating a jog dial\nB. clicking button and rolling wheel on a mouse\nC. Tapping a touchpad and scrolling with two fingers", "gt-answer": "B. clicking button and rolling wheel on a mouse", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1066801717": { "action": [ { "question": "What is the woman doing in the video?\nA. watering bouquet of daffodils\nB. arranging bouquet of daffodils\nC. cutting bouquet of daffodils", "gt-answer": "B. arranging bouquet of daffodils", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action is being performed by the woman?\nA. cutting bouquet of daffodils\nB. arranging bouquet of daffodils\nC. watering bouquet of daffodils", "gt-answer": "B. arranging bouquet of daffodils", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity can be seen in the video involving the woman?\nA. arranging bouquet of daffodils\nB. watering bouquet of daffodils\nC. cutting bouquet of daffodils", "gt-answer": "A. arranging bouquet of daffodils", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1088428381": { "action": [ { "question": "What is the woman doing in the video?\nA. storing items in a gift box\nB. opening a gift box\nC. wrapping a gift box\nD. delivering a gift box", "gt-answer": "B. opening a gift box", "video-llm-prediction": "C", "match_success": true, "rating": 0 }, { "question": "What action is the woman performing?\nA. wrapping a gift box\nB. delivering a gift box\nC. opening a gift box\nD. storing items in a gift box", "gt-answer": "C. opening a gift box", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what action can be observed from the woman?\nA. storing items in a gift box\nB. delivering a gift box\nC. wrapping a gift box\nD. opening a gift box", "gt-answer": "D. opening a gift box", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1069593640": { "action": [ { "question": "What is the woman doing in the video?\nA. drying hair with a towel\nB. washing face with a towel\nC. putting a towel on her neck", "gt-answer": "C. putting a towel on her neck", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is being performed by the woman?\nA. putting a towel on her neck\nB. drying hair with a towel\nC. washing face with a towel", "gt-answer": "A. putting a towel on her neck", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which of the following actions is shown in the video?\nA. putting a towel on her neck\nB. drying hair with a towel\nC. washing face with a towel", "gt-answer": "A. putting a towel on her neck", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "8307961": { "order": [ { "question": "What is the correct order of actions performed by the man?\nA. Walking and simultaneously showing something on his tablet to a woman\nB. Chatting with a woman while walking and then showing something on his tablet to a woman\nC. Showing something on his tablet to a woman and then chatting with a woman while walking", "gt-answer": "B. Chatting with a woman while walking and then showing something on his tablet to a woman", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video?\nA. Chatting with a woman while walking and then showing something on his tablet to a woman\nB. Walking and simultaneously showing something on his tablet to a woman\nC. Showing something on his tablet to a woman and then chatting with a woman while walking", "gt-answer": "A. Chatting with a woman while walking and then showing something on his tablet to a woman", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is happening first in the video?\nA. Chatting with a woman while walking\nB. Showing something on his tablet to a woman\nC. They happen at the same time", "gt-answer": "A. Chatting with a woman while walking", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "15439453": { "action": [ { "question": "What activities are being performed simultaneously in the video?\nA. Tango dancing and playing piano\nB. Ballet dancing and playing saxophone\nC. Tango dancing and playing violin\nD. Tango dancing and playing saxophone", "gt-answer": "D. Tango dancing and playing saxophone", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which two actions are depicted in the video?\nA. Tango dancing and playing piano\nB. Tango dancing and playing saxophone\nC. Ballet dancing and playing saxophone\nD. Tango dancing and playing violin", "gt-answer": "B. Tango dancing and playing saxophone", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Who is playing saxophone in the video?\nA. A boy\nB. A couple\nC. A girl", "gt-answer": "C. A girl", "video-llm-prediction": "A. A boy", "match_success": true, "rating": 0 } ] }, "1107947873": { "action": [ { "question": "What is the doctor doing in the scenario?\nA. writing a prescription\nB. giving medicine to a patient\nC. performing a surgery", "gt-answer": "B. giving medicine to a patient", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the primary role of the doctor in the scene?\nA. giving medicine to a patient\nB. checking vitals\nC. greeting patients", "gt-answer": "A. giving medicine to a patient", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which activity can be seen in the video involving the doctor?\nA. writing a prescription\nB. giving medicine to a patient\nC. performing a surgery", "gt-answer": "B. giving medicine to a patient", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1081194848": { "action": [ { "question": "What is the researcher doing in the video?\nA. teaching children how to cook a frog\nB. teaching children how to feed a frog\nC. teaching children how to dissect a frog\nD. teaching children how to catch a frog", "gt-answer": "C. teaching children how to dissect a frog", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity are the people engaged in?\nA. dissect a frog\nB. feed a frog\nC. cook a frog\nD. catch a frog", "gt-answer": "A. dissect a frog", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What task is the researcher performing with the children?\nA. cook a frog\nB. dissect a frog\nC. feed a frog\nD. catch a frog", "gt-answer": "B. dissect a frog", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1091526823": { "action": [ { "question": "What is happening to the hand in the video?\nA. opening a book\nB. writing on a book\nC. turning over pages of a book\nD. closing a book", "gt-answer": "C. turning over pages of a book", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is the hand performing?\nA. opening a book\nB. writing on a book\nC. closing a book\nD. turning over pages of a book", "gt-answer": "D. turning over pages of a book", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the hand doing?\nA. opening a book\nB. writing on a book\nC. closing a book\nD. turning over pages of a book", "gt-answer": "D. turning over pages of a book", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "26631100": { "order": [ { "question": "What is the order of events in the video?\nA. One hand is holding the clay pot, then three hands are holding the clay pot\nB. Three hands are holding the clay pot, then two hands are holding the clay pot\nC. Two hands are holding the clay pot, then three hands are holding the clay pot", "gt-answer": "B. Three hands are holding the clay pot, then two hands are holding the clay pot", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What happens first in the video?\nA. Three hands are holding the clay pot\nB. One hand is holding the clay pot\nC. Two hands are holding the clay pot", "gt-answer": "A. Three hands are holding the clay pot", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What happens last in the video?\nA. Two hands are holding the clay pot\nB. One hand is holding the clay pot\nC. Three hands are holding the clay pot", "gt-answer": "A. Two hands are holding the clay pot", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1104663381": { "action": [ { "question": "What is the man doing in the video?\nA. cutting a pizza dough\nB. stretching a pizza dough\nC. folding a pizza dough", "gt-answer": "B. stretching a pizza dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity is the man engaged in while being filmed?\nA. cutting a pizza dough\nB. stretching a pizza dough\nC. folding a pizza dough", "gt-answer": "B. stretching a pizza dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What is the man's action depicted in the video?\nA. cutting a pizza dough\nB. stretching a pizza dough\nC. folding a pizza dough", "gt-answer": "B. stretching a pizza dough", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "direction": [ { "question": "What is the direction in which the pizza dough is rotating?\nA. counter-clockwise\nB. clockwise\nC. it is not rotating", "gt-answer": "A. counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what direction is the pizza dough moving?\nA. flipping up and down\nB. rotating clockwise\nC. rotating counter-clockwise\nD. flipping left and right", "gt-answer": "C. rotating counter-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the rotational direction of the pizza dough?\nA. clockwise\nB. stationary\nC. anti-clockwise", "gt-answer": "C. anti-clockwise", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "22100041": { "action": [ { "question": "What is the woman doing in the video?\nA. waving goodbye\nB. clapping her hands\nC. doing an invitation gesture\nD. pointing towards something", "gt-answer": "C. doing an invitation gesture", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action is the woman performing?\nA. waving goodbye\nB. pointing towards something\nC. clapping her hands\nD. doing an invitation gesture", "gt-answer": "D. doing an invitation gesture", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "When captured on video, what action is the woman engaged in?\nA. waving goodbye\nB. doing an invitation gesture\nC. pointing towards something\nD. clapping her hands", "gt-answer": "B. doing an invitation gesture", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1103623921": { "action": [ { "question": "What is the man doing in the video?\nA. playing pool\nB. playing football\nC. cooking", "gt-answer": "A. playing pool", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What activity is the man engaged in?\nA. sleeping\nB. dancing\nC. playing pool", "gt-answer": "C. playing pool", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action is the man performing?\nA. swimming\nB. playing pool\nC. reading books", "gt-answer": "B. playing pool", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ], "speed": [ { "question": "What is the speed that the video is palying?\nA. slow-motion\nB. fast-forward\nC. normal speed\nD. stopped", "gt-answer": "C. normal speed", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How would you describe the speed at which the video is playing?\nA. Slowly\nB. Normally\nC. Rapidly", "gt-answer": "B. Normally", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What playback rate is the video currently at?\nA. Slow motion\nB. Paused\nC. Normal pace\nD. Fast-forwarded", "gt-answer": "C. Normal pace", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1093338031": { "action": [ { "question": "What is the man attempting to do?\nA. click a computer screen\nB. fix a computer screen\nC. clean a computer screen\nD. punch a computer screen", "gt-answer": "D. punch a computer screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action is the man trying to perform?\nA. fix a computer screen\nB. clean a computer screen\nC. click a computer screen\nD. punch a computer screen", "gt-answer": "D. punch a computer screen", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the man's activity in the video?\nA. Attempting to punch a computer screen\nB. Attempting to fix a computer screen\nC. Attempting to clean a computer screen\nD. Attempting to click a computer screen", "gt-answer": "A. Attempting to punch a computer screen", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1064310466": { "action": [ { "question": "What is the man doing?\nA. watering cocoa seeds\nB. planting cocoa seeds\nC. baking cocoa seeds\nD. peeling cocoa seeds", "gt-answer": "D. peeling cocoa seeds", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which activity is the man involved in?\nA. baking cocoa seeds\nB. watering cocoa seeds\nC. peeling cocoa seeds\nD. planting cocoa seeds", "gt-answer": "C. peeling cocoa seeds", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the man performing?\nA. planting cocoa seeds\nB. watering cocoa seeds\nC. baking cocoa seeds\nD. peeling cocoa seeds", "gt-answer": "D. peeling cocoa seeds", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "1088497853": { "direction": [ { "question": "What is the direction of the movement in the video?\nA. leftwards\nB. upwards\nC. rightwards\nD. downwards", "gt-answer": "B. upwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which direction is the camera moving before the stone building?\nA. rightwards\nB. upwards\nC. leftwards\nD. downwards", "gt-answer": "B. upwards", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the trajectory of the camera movement in the video?\nA. flying downwards\nB. flying rightwards\nC. flying upwards\nD. flying leftwards", "gt-answer": "C. flying upwards", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1106087175": { "action": [ { "question": "What is the man doing in the video?\nA. wearing a white sneaker\nB. drawing on a white sneaker\nC. taking off a white sneaker\nD. tying shoelaces on a white sneaker", "gt-answer": "B. drawing on a white sneaker", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity is the man engaged in?\nA. drawing on a white sneaker\nB. taking off a white sneaker\nC. tying shoelaces on a white sneaker\nD. wearing a white sneaker", "gt-answer": "A. drawing on a white sneaker", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which action can be observed in the video?\nA. drawing on a white sneaker\nB. taking off a white sneaker\nC. wearing a white sneaker\nD. tying shoelaces on a white sneaker", "gt-answer": "A. drawing on a white sneaker", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "13324343": { "order": [ { "question": "What is the order of events in the video?\nA. Man gliding on the skateboard and then tying his shoelaces\nB. Man tying his shoelaces and then gliding on the skateboard\nC. Man gliding on the skateboard and then jumping\nD. Man jumping and then tying his shoelaces", "gt-answer": "B. Man tying his shoelaces and then gliding on the skateboard", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In which sequence does the man perform the actions?\nA. gliding on the skateboard and then jumping\nB. jumping and then tying his shoelaces\nC. tying his shoelaces and then gliding on the skateboard\nD. gliding on the skateboard and then tying his shoelaces", "gt-answer": "C. tying his shoelaces and then gliding on the skateboard", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the correct order of actions by the man?\nA. gliding on the skateboard and then tying his shoelaces\nB. tying his shoelaces and then gliding on the skateboard\nC. jumping and then tying his shoelaces\nD. gliding on the skateboard and then jumping", "gt-answer": "B. tying his shoelaces and then gliding on the skateboard", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1083624811": { "action": [ { "question": "What is the woman doing in the exercise?\nA. performing push-ups\nB. performing alternating leg lift plank\nC. performing a traditional plank hold\nD. performing side plank variations", "gt-answer": "B. performing alternating leg lift plank", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action is the woman carrying out?\nA. performing side plank variations\nB. performing a traditional plank hold\nC. performing alternating leg lift plank\nD. performing push-ups", "gt-answer": "C. performing alternating leg lift plank", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity is the woman engaged in?\nA. performing alternating leg lift plank\nB. performing push-ups\nC. performing a traditional plank hold\nD. performing side plank variations", "gt-answer": "A. performing alternating leg lift plank", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1014976360": { "order": [ { "question": "What is the order of events for the man?\nA. putting on his glasses and then looking at his phone\nB. taking off his glasses and then looking at his phone\nC. looking at his phone and then putting on his glasses\nD. looking at his phone and then taking off his glasses", "gt-answer": "D. looking at his phone and then taking off his glasses", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which event does the man do first?\nA. looking at his phone\nB. taking off his glasses\nC. putting on his glasses", "gt-answer": "A. looking at his phone", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event does the man do second?\nA. taking off his glasses\nB. putting on his glasses\nC. looking at his phone", "gt-answer": "A. taking off his glasses", "video-llm-prediction": "B", "match_success": true, "rating": 0 } ] }, "18416608": { "order": [ { "question": "In which order does the woman perform the actions?\nA. operating her tablet first, then sampling water in a bottle\nB. the actions are performed simultaneously\nC. sampling water in a bottle first, then operating her tablet", "gt-answer": "C. sampling water in a bottle first, then operating her tablet", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the first action that the woman does?\nA. sampling water in a bottle\nB. the actions are performed simultaneously\nC. operating her tablet", "gt-answer": "A. sampling water in a bottle", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the second action that the woman does?\nA. sampling water in a bottle\nB. the actions are performed simultaneously\nC. operating her tablet", "gt-answer": "C. operating her tablet", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1061351290": { "order": [ { "question": "What is the order of events in the video involving the woman?\nA. measuring her belly with a measuring tape and then touching her pregnant belly\nB. touching her pregnant belly and then taking a nap\nC. taking a nap and then measuring her belly with a measuring tape\nD. touching her pregnant belly and then measuring her belly with a measuring tape", "gt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What sequence of actions does the woman follow in the video?\nA. measuring her belly with a measuring tape and then touching her pregnant belly\nB. taking off clothes then measuring her belly with a measuring tape\nC. touching her pregnant belly and then taking off clothes\nD. touching her pregnant belly and then measuring her belly with a measuring tape", "gt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In what order does the woman perform the actions in the video?\nA. taking off clothes then measuring her belly with a measuring tape\nB. touching her pregnant belly and then measuring her belly with a measuring tape\nC. measuring her belly with a measuring tape and then touching her pregnant belly\nD. touching her pregnant belly and then taking off clothes", "gt-answer": "B. touching her pregnant belly and then measuring her belly with a measuring tape", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1066238617": { "action": [ { "question": "What is the woman doing?\nA. dancing\nB. practising her punches\nC. cooking", "gt-answer": "B. practising her punches", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity is the woman engaged in?\nA. singing\nB. practising her punches\nC. swimming", "gt-answer": "B. practising her punches", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which action is the woman performing?\nA. playing chess\nB. practising her punches\nC. writing", "gt-answer": "B. practising her punches", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1072000366": { "action": [ { "question": "What are the girls doing to each other?\nA. elbowing each other\nB. giving high five to each other\nC. waving at each other\nD. shaking hands", "gt-answer": "A. elbowing each other", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which action are the girls engaged in?\nA. waving at each other\nB. shaking hands\nC. giving high five to each other\nD. elbowing each other", "gt-answer": "D. elbowing each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity are the girls involved in?\nA. waving at each other\nB. shaking hands\nC. giving high five to each other\nD. elbowing each other", "gt-answer": "D. elbowing each other", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1065272113": { "action": [ { "question": "What is the doctor doing to the woman?\nA. taking her blood pressure\nB. checking her temperature\nC. giving her an injection", "gt-answer": "C. giving her an injection", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the doctor performing on the woman?\nA. applying bandage\nB. writing a prescription\nC. giving an injection", "gt-answer": "C. giving an injection", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the doctor engaged in?\nA. writing a prescription\nB. giving an injection\nC. applying bandage", "gt-answer": "B. giving an injection", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1072971926": { "action": [ { "question": "What is the man doing with the pizza box?\nA. opening the pizza box\nB. wrapping the pizza box\nC. eating the pizza\nD. closing the pizza box", "gt-answer": "A. opening the pizza box", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action is being performed by the man?\nA. closing the pizza box\nB. eating the pizza\nC. wrapping the pizza box\nD. opening the pizza box", "gt-answer": "D. opening the pizza box", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the man engaged in?\nA. opening the pizza box\nB. eating the pizza\nC. wrapping the pizza box\nD. closing the pizza box", "gt-answer": "A. opening the pizza box", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "3399348431": { "action": [ { "question": "What is the person doing with the sauce?\nA. mixing it with the vegetables\nB. squeezing it into a bowl of vegetables\nC. dipping vegetables in it", "gt-answer": "B. squeezing it into a bowl of vegetables", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the video showing?\nA. dipping vegetables on the sauce\nB. squeezing the sauce into a bowl of vegetables\nC. mixing sauce with the vegetables", "gt-answer": "B. squeezing the sauce into a bowl of vegetables", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is being performed with the sauce?\nA. squeezing it into a bowl of vegetables\nB. dipping vegetables in it\nC. mixing it with the vegetables", "gt-answer": "A. squeezing it into a bowl of vegetables", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1025137214": { "action": [ { "question": "What is the man doing?\nA. walking\nB. smoking cigarette\nC. talking on the phone", "gt-answer": "B. smoking cigarette", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What action is the man engaged in?\nA. reading a book\nB. smoking cigarette\nC. writing a letter", "gt-answer": "B. smoking cigarette", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which activity is the man involved in?\nA. playing soccer\nB. smoking cigarette\nC. cooking a meal", "gt-answer": "B. smoking cigarette", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1033101626": { "action": [ { "question": "What is the man doing?\nA. cooking\nB. singing\nC. playing instrument", "gt-answer": "C. playing instrument", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the man engaged in?\nA. dancing\nB. reading\nC. playing instrument", "gt-answer": "C. playing instrument", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which action is the man performing?\nA. walking\nB. sleeping\nC. playing instrument", "gt-answer": "C. playing instrument", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "9537677": { "action": [ { "question": "What activity is the woman engaged in?\nA. reading a book\nB. watching TV\nC. playing tablet\nD. cooking", "gt-answer": "C. playing tablet", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the woman's action in the video?\nA. playing tablet\nB. dancing\nC. painting\nD. driving", "gt-answer": "A. playing tablet", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the main focus of the woman's attention?\nA. listening to music\nB. playing tablet\nC. talking on the phone\nD. cooking", "gt-answer": "B. playing tablet", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1077388994": { "action": [ { "question": "What action is the woman performing?\nA. singing\nB. dancing\nC. patting the baby", "gt-answer": "C. patting the baby", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the woman engaged in?\nA. cooking dinner\nB. gardening\nC. patting the baby", "gt-answer": "C. patting the baby", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which of the following is the woman doing?\nA. writing a letter\nB. reading a book\nC. patting the baby", "gt-answer": "C. patting the baby", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1037531786": { "action": [ { "question": "What are the two men doing in the video?\nA. dancing\nB. cooking\nC. boxing\nD. painting", "gt-answer": "C. boxing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which physical activity are the two men engaged in?\nA. swimming\nB. running\nC. boxing\nD. cycling", "gt-answer": "C. boxing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What sport are the two men participating in?\nA. basketball\nB. football\nC. boxing\nD. tennis", "gt-answer": "C. boxing", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1077275024": { "action": [ { "question": "What is the girl doing in the video?\nA. Jumping with a man playing ukulele\nB. Dancing with a man playing ukulele\nC. Clapping hands for a man playing ukulele", "gt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What activity is the girl engaged in?\nA. Sitting and watching a man play the ukulele\nB. Playing the ukulele alongside the man\nC. Clapping hands for a man playing ukulele", "gt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the girl performing?\nA. Recording the man playing the ukulele\nB. Dancing with a man playing ukulele\nC. Clapping hands for a man playing ukulele", "gt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1107180099": { "action": [ { "question": "What are the women doing?\nA. singing\nB. painting\nC. dancing\nD. cooking", "gt-answer": "C. dancing", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which activity are the women engaged in?\nA. swimming\nB. playing basketball\nC. dancing\nD. gardening", "gt-answer": "C. dancing", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the primary action of the group of women?\nA. playing football\nB. dancing\nC. reading\nD. skiing", "gt-answer": "B. dancing", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1049434159": { "action": [ { "question": "What are the parents and daughter doing together?\nA. cooking dinner\nB. playing video games\nC. reading a book", "gt-answer": "B. playing video games", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What activity are the parents and daughter engaged in?\nA. hiking\nB. playing video games\nC. dancing", "gt-answer": "B. playing video games", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which of the following actions are the parents and daughter involved in?\nA. painting\nB. playing video games\nC. gardening", "gt-answer": "B. playing video games", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "3402234027": { "action": [ { "question": "What is the cat doing in the video?\nA. sleeping\nB. playing with a toy\nC. eating food", "gt-answer": "C. eating food", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which activity is the cat engaged in?\nA. swimming\nB. climbing a tree\nC. eating food", "gt-answer": "C. eating food", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the cat performing?\nA. running on the ground\nB. sitting on a chair\nC. eating food on the ground", "gt-answer": "C. eating food on the ground", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1056491306": { "action": [ { "question": "What are the passengers doing on the subway?\nA. sleeping on the bed\nB. standing in a room\nC. taking a seat on subway\nD. dancing on the stage", "gt-answer": "C. taking a seat on subway", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity are the passengers engaged in while on the subway train?\nA. talking\nB. reading\nC. taking a seat\nD. eating", "gt-answer": "C. taking a seat", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which action are the passengers performing inside the subway?\nA. running on a treadmill\nB. walking on the street\nC. taking a seat on subway\nD. jumping on the floor", "gt-answer": "C. taking a seat on subway", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1012085909": { "action": [ { "question": "What are the people doing in the video?\nA. rolling boats on the lake\nB. walking on the street\nC. pushing bikes up a hill", "gt-answer": "C. pushing bikes up a hill", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "How are the people moving?\nA. running\nB. swimming\nC. pushing bikes", "gt-answer": "C. pushing bikes", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What is the main activity of the people?\nA. rollerblading\nB. playing basketball\nC. pushing bikes", "gt-answer": "C. pushing bikes", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1079406734": { "action": [ { "question": "What is the man doing to the car in the video?\nA. riding bikes\nB. taking a shower\nC. washing the car\nD. driving the car", "gt-answer": "C. washing the car", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is being performed by the man?\nA. feeding a dog\nB. reading a book\nC. washing the car\nD. playing the guitar", "gt-answer": "C. washing the car", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In the video, what activity is the man engaged in?\nA. dancing\nB. sleeping\nC. washing the car\nD. cooking", "gt-answer": "C. washing the car", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1022115337": { "order": [ { "question": "What is the order of events?\nA. dancing and then sending an air kiss\nB. sending an air kiss and then dancing\nC. dancing at the same time as sending an air kiss", "gt-answer": "A. dancing and then sending an air kiss", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which event occurs first?\nA. dancing\nB. sending an air kiss\nC.Both events happen at the same time", "gt-answer": "A. dancing", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "Which event occurs second?\nA. dancing\nB. sending an air kiss\nC.Both events happen at the same time", "gt-answer": "B. sending an air kiss", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1071214909": { "action": [ { "question": "What is the person doing on the wood surface?\nA. carving a design\nB. measuring the length\nC. drawing a cutting line\nD. sanding the surface", "gt-answer": "C. drawing a cutting line", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the action performed by the person?\nA. drawing a cuttting line on a wood surface\nB. erasing a line on a wood surface\nC. carving a pattern on a wood surface\nD. measuring length on a wood surface", "gt-answer": "A. drawing a cuttting line on a wood surface", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the video about?\nA. drawing a cuttting line on a wood surface\nB. erasing a line on a wood surface\nC. carving a pattern on a wood surface\nD. measuring length on a wood surface", "gt-answer": "A. drawing a cuttting line on a wood surface", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "1092065543": { "action": [ { "question": "What is the man doing?\nA. eating\nB. shopping\nC. sleeping\nD. running", "gt-answer": "B. shopping", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "Which activity is the man engaged in?\nA. cooking\nB. gardening\nC. shopping\nD. painting", "gt-answer": "C. shopping", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "In the video, what can we see the man doing?\nA. singing\nB. dancing\nC. shopping\nD. playing guitar", "gt-answer": "C. shopping", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1017063703": { "action": [ { "question": "What is the person doing in the video?\nA. baking cakes\nB. decorating cakes\nC. cutting cakes\nD. presenting cakes to guests", "gt-answer": "B. decorating cakes", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What action is demonstrated in the video?\nA. baking cakes\nB. decorating cakes\nC. cutting cakes\nD. presenting cakes to guests", "gt-answer": "B. decorating cakes", "video-llm-prediction": "B", "match_success": true, "rating": 1 }, { "question": "What task is being performed in the footage?\nA. baking cakes\nB. decorating cakes\nC. cutting cakes\nD. presenting cakes to guests", "gt-answer": "B. decorating cakes", "video-llm-prediction": "B", "match_success": true, "rating": 1 } ] }, "1055022287": { "action": [ { "question": "What is the man doing in the video?\nA. cooking\nB. singing\nC. cleaning a swimming pool", "gt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which activity is being performed by the man in the video?\nA. dancing\nB. playing basketball\nC. cleaning a swimming pool", "gt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What action is the man undertaking?\nA. reading\nB. sleeping\nC. cleaning a swimming pool", "gt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1094259081": { "action": [ { "question": "What is the woman doing in the video?\nA. watching VR movie\nB. listening to music using VR\nC. playing VR shooting game\nD. working out using VR", "gt-answer": "C. playing VR shooting game", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is the woman engaged in?\nA. watching VR movie\nB. listening to music using VR\nC. playing VR shooting game\nD. working out using VR", "gt-answer": "C. playing VR shooting game", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "Which activity is the woman participating in?\nA. watching VR movie\nB. listening to music using VR\nC. playing VR shooting game\nD. working out using VR", "gt-answer": "C. playing VR shooting game", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1022260408": { "action": [ { "question": "What is the squirrel doing in the video?\nA. sleeping\nB. running\nC. eating food", "gt-answer": "C. eating food", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "What activity is the squirrel engaged in?\nA. chasing its tail\nB. cleaning itself\nC. eating food", "gt-answer": "C. eating food", "video-llm-prediction": "C", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the squirrel performing?\nA. climbing a tree\nB. swimming in a pond\nC. eating food", "gt-answer": "C. eating food", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1089810969": { "action": [ { "question": "How does the little girl interact with the woman?\nA. she runs towards her and hugs her\nB. she walks towards her and hug her\nC. she runs towards her and jumps on her back\nD. she runs towards her and talks to her", "gt-answer": "A. she runs towards her and hugs her", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What action does the little girl perform?\nA. she runs towards a woman and hugs her\nB. she walks towards a woman and hugs her\nC. she runs towards a woman and jumps on her back\nD. she runs towards a woman and talks to her", "gt-answer": "A. she runs towards a woman and hugs her", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "Which of the following actions is the little girl performing?\nA. she runs towards a woman and hugs her\nB. she walks towards a woman and hugs her\nC. she runs towards a woman and jumps on her back\nD. she runs towards a woman and talks to her", "gt-answer": "A. she runs towards a woman and hugs her", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] }, "6165731": { "action": [ { "question": "What is the scientist doing in the experiment?\nA. observing quietly on the experiment\nB. leisurely conducting experiments\nC. looking confused and frustrated about the experiment", "gt-answer": "C. looking confused and frustrated about the experiment", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "How does the scientist feel about the experiment?\nA. excited and motivated\nB. bored and disinterested\nC. confused and frustrated", "gt-answer": "C. confused and frustrated", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What is the emotional state of the scientist during the experiment?\nA. calm and content\nB. happy and satisfied\nC. confused and frustrated", "gt-answer": "C. confused and frustrated", "video-llm-prediction": "C", "match_success": true, "rating": 1 } ] }, "1111469465": { "action": [ { "question": "What is the man doing in the video?\nA. raising his arm to look at the watch looking happy\nB. raising his arm to look at the watch looking calm\nC. raising his arm to look at the watch looking anxious\nD. putting his hands in his pockets looking anxious", "gt-answer": "C. raising his arm to look at the watch looking anxious", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "What action is being performed by the man?\nA. raising his arm to look at the watch looking happy\nB. raising his arm to look at the watch looking calm\nC. raising his arm to look at the watch looking anxious\nD. putting his hands in his pockets looking anxious", "gt-answer": "C. raising his arm to look at the watch looking anxious", "video-llm-prediction": "A", "match_success": true, "rating": 0 }, { "question": "In the video, what is the man's action?\nA. raising his arm to look at the watch looking happy\nB. raising his arm to look at the watch looking calm\nC. raising his arm to look at the watch looking anxious\nD. putting his hands in his pockets looking anxious", "gt-answer": "C. raising his arm to look at the watch looking anxious", "video-llm-prediction": "A", "match_success": true, "rating": 0 } ] }, "1050000214": { "action": [ { "question": "What action is the little child performing?\nA. Running\nB. Swimming\nC. Water jumping\nD. Dancing", "gt-answer": "C. Water jumping", "video-llm-prediction": "B", "match_success": true, "rating": 0 }, { "question": "What is the little child doing in the video?\nA. Eating\nB. Sleeping\nC. Crying\nD. Water jumping", "gt-answer": "D. Water jumping", "video-llm-prediction": "D", "match_success": true, "rating": 1 }, { "question": "Which action is the little child engaged in?\nA. Reading\nB. Writing\nC. Singing\nD. Water jumping", "gt-answer": "D. Water jumping", "video-llm-prediction": "D", "match_success": true, "rating": 1 } ] }, "27537016": { "order": [ { "question": "What is the sequence of events involving the man?\nA. showing off his car key then pulling back inside the car\nB. pulling back inside the car then showing off his car key\nC. throwing away his car key then pulling back inside the car\nD. pulling back inside the car then throwing away his car key", "gt-answer": "A. showing off his car key then pulling back inside the car", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "What is the correct order of actions performed by the man?\nA. showing off his car key, pulling back inside the car\nB. pulling back inside the car, showing off his car key\nC. throwing away his car key, pulling back inside the car\nD. pulling back inside the car, throwing away his car key", "gt-answer": "A. showing off his car key, pulling back inside the car", "video-llm-prediction": "A", "match_success": true, "rating": 1 }, { "question": "In what order did the man do the activities?\nA. showing off his car key, pulling back inside the car\nB. pulling back inside the car, showing off his car key\nC. throwing away his car key, pulling back inside the car\nD. pulling back inside the car, throwing away his car key", "gt-answer": "A. showing off his car key, pulling back inside the car", "video-llm-prediction": "A", "match_success": true, "rating": 1 } ] } }, "captioning": { "1034419625": { "action": [ { "chatgpt-reasoning": "The video description specifically mentions that the man is dribbling a basketball, dunking a basketball, and passing a basketball.", "chatgpt-answer": "B. dribbling a basketball, C. passing a basketball", "video-llm-prediction": "The video showcases a man dribbling a basketball, dunking a basketball, and passing a basketball. The man is seen moving around the court while performing these actions. The video captures the man's movements and the sound of the ball bouncing on the court. The man's dribbling skills are impressive, and he seems to be in control of the ball at all times. The dunking and passing actions are also executed with precision, and the man's movements are fluid and graceful. Overall, the video is a great display of basketball skills and is sure to impress any basketball", "gt-answer": "A. dunking a basketball", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the man is seen dribbling the basketball, dunking the ball into the basket, and passing the ball to another player. These actions indicate that the man is engaged in playing basketball.", "chatgpt-answer": "B. dribbling a basketball", "video-llm-prediction": "The video showcases a man dribbling, dunking, and passing a basketball. The man is seen dribbling the basketball in a dark room, and then he dunks the ball into the basket. Later, the man is seen passing the ball to another player. The video highlights the man's basketball skills, and the dark room adds a mysterious and dramatic effect to the video.", "gt-answer": "A. dunking a basketball", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the man is dribbling a basketball and then dunking it into the net.", "chatgpt-answer": "B. dribbling a basketball", "video-llm-prediction": "A man dribbles a basketball, then dunks it into the net.", "gt-answer": "A. dunking a basketball", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is dribbling a basketball, passing it to another player, and then dunking it into the basket.", "chatgpt-answer": "C. passing a basketball", "video-llm-prediction": "A man dribbles a basketball, passes it to another player, and then dunks it into the basket.", "gt-answer": "A. dunking a basketball", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description states that the man is first seen moving away from the camera while holding a basketball, and then he moves towards the camera.", "chatgpt-answer": "A. moving towards the camera", "video-llm-prediction": "A man is seen moving away from the camera while holding a basketball. He then moves towards the camera and shoots the basketball into the hoop.", "gt-answer": "B. moving from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is initially moving away from the camera, and then moves towards the camera.", "chatgpt-answer": "C. moving away from the camera", "video-llm-prediction": "A man is seen moving away from the camera while holding a basketball. He then moves towards the camera while still holding the basketball.", "gt-answer": "B. moving from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is moving away from the camera.", "chatgpt-answer": "C. moving away from the camera", "video-llm-prediction": "A man is seen moving away from the camera while holding a basketball.", "gt-answer": "B. moving from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is seen moving away from the camera while holding a basketball. Therefore, the correct answer is C. moving away from the camera.", "chatgpt-answer": "C. moving away from the camera", "video-llm-prediction": "A man is seen moving away from the camera while holding a basketball. He then moves towards the camera and shoots the ball into the basket.", "gt-answer": "B. moving from left to right", "rating": 0 } ] }, "1094590221": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is dribbling a basketball, passing it to another man, and then dunking it into the basket.", "chatgpt-answer": "D. dunking basketball", "video-llm-prediction": "The video shows a man dribbling a basketball, passing it to another man, and then dunking it into the basket. The video captures the man's movements as he performs these actions.", "gt-answer": "C. shooting basketball", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen dribbling a basketball and then passes the ball to another player, who dunks it into the basket. Therefore, the correct answer is:", "chatgpt-answer": "A. dribbling basketball", "video-llm-prediction": "A man is seen dribbling a basketball in a video. He then passes the ball to another player, who dunks it into the basket. The video captures the man's skills in dribbling, passing, and dunking the basketball.", "gt-answer": "C. shooting basketball", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically states that the man is dribbling a basketball on a court. Therefore, the correct answer should be A. dribbling basketball.", "chatgpt-answer": "A. dribbling basketball", "video-llm-prediction": "A man dribbles a basketball on a court during a sunset.", "gt-answer": "C. shooting basketball", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is seen dribbling, passing, and shooting a basketball.", "chatgpt-answer": "A. dribbling basketball", "video-llm-prediction": "A man is seen dribbling, passing, and shooting a basketball in a video.", "gt-answer": "C. shooting basketball", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that the man is seen dribbling the ball and then shooting it into the basket. Based on this information, we can infer that the basketball is moving in the direction that the man is playing, which would be straight ahead.", "chatgpt-answer": "A. straight ahead", "video-llm-prediction": "A man is seen playing basketball in a court. He is seen dribbling the ball and then shooting it into the basket. The video captures the man's movements as he plays basketball.", "gt-answer": "C. right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the ball is seen flying straight ahead and then from left to right.", "chatgpt-answer": "B. left to right", "video-llm-prediction": "A man is seen dribbling a basketball on a court while the sun sets in the background. The ball is seen flying straight ahead and then from left to right.", "gt-answer": "C. right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the basketball player is shooting a basket, but it does not mention anything about the direction of the basketball. Therefore, we cannot determine the direction of the basketball based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A basketball player is seen shooting a basket while the sun sets in the background.", "gt-answer": "C. right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a basketball player shoots a basket. When shooting a basket, the basketball typically moves in a straight-ahead direction towards the hoop.", "chatgpt-answer": "A. straight ahead", "video-llm-prediction": "A basketball player shoots a basket while the sun sets in the background.", "gt-answer": "C. right to left", "rating": 0 } ] }, "1098982673": { "action": [ { "chatgpt-reasoning": "The video description mentions that the two women are singing and dancing while holding a rolling pin and a cookie. They are also shown laughing at the end of the video.", "chatgpt-answer": "B. Dancing and singing", "video-llm-prediction": "Two women are shown in a kitchen, one of them is holding a rolling pin and the other is holding a cookie. They are singing and dancing while holding the objects. The video ends with the two women holding a cookie and laughing.", "gt-answer": "B. Dancing and singing", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that one woman is singing while the other is dancing. There is no mention of eating, sleeping, or running.", "chatgpt-answer": "B. Dancing and singing", "video-llm-prediction": "Two women are seen in a kitchen, one of them is singing while the other is dancing. They are both wearing aprons and are holding a rolling pin. The woman who is singing is also holding a spoon. The woman who is dancing is wearing a pink shirt and is holding a spoon as well. The kitchen is well-lit and has a white color scheme. The women seem to be enjoying themselves as they sing and dance.", "gt-answer": "B. Dancing and singing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that one of the women is singing while the other is dancing. Therefore, the correct answer would be B. Dancing and singing.", "chatgpt-answer": "B. Dancing and singing", "video-llm-prediction": "Two women are seen in a kitchen, one of them is singing while the other is dancing.", "gt-answer": "B. Dancing and singing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the two women are seen dancing and singing while holding a rolling pin. They are also seen eating and singing while holding a knife. This indicates that the women are engaged in both activities simultaneously.", "chatgpt-answer": "B. Dancing and singing", "video-llm-prediction": "Two women are seen in a kitchen, dancing and singing while holding a rolling pin. They are also seen eating and singing while holding a knife.", "gt-answer": "B. Dancing and singing", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the actions and movements of the two women in the kitchen, but does not mention anything about the speed at which these actions occur.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two women are seen standing in a kitchen, one holding a rolling pin and the other holding a bowl. They are speaking to the camera and begin to dance around the kitchen. They continue to dance and sing while holding the objects in their hands. The video ends with the women holding the objects and speaking to the camera.", "gt-answer": "A. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two women are standing in a kitchen, holding a rolling pin and a cookie sheet. They are laughing and talking to the camera. The women then proceed to roll out the dough and place it on the cookie sheet. They then put the cookie sheet in the oven. The women are seen taking the cookie sheet out of the oven and placing it on a plate. They then eat the cookies and laugh.", "gt-answer": "A. normal speed", "rating": 0 }, { "chatgpt-reasoning": "There is no information provided in the video description regarding the speed of the video. Therefore, it is not possible to determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two women are shown in a kitchen, laughing and dancing while holding a rolling pin. They are seen making cookies and dancing around the kitchen.", "gt-answer": "A. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. Therefore, it cannot be determined which choice is correct.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two women are shown in a kitchen, laughing and dancing while holding a rolling pin. They are seen making cookies and dancing around the kitchen.", "gt-answer": "A. normal speed", "rating": 0 } ] }, "1111657885": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that two people are seen ice skating in a gym. There is no mention of skiing or swimming in the description.", "chatgpt-answer": "B. ice skating", "video-llm-prediction": "Two people are seen ice skating in a gym. They are wearing black and white outfits and are holding poles. The gym has a blue wall and a clock on the wall. The video shows the two people skating around the gym while the camera follows them.", "gt-answer": "B. ice skating", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the first scene shows a person skiing on a snowy hill, and the second scene features a group of people ice skating on an indoor rink. Therefore, the people in the video are skiing and ice skating.", "chatgpt-answer": "A. skiing, B. ice skating", "video-llm-prediction": "The video showcases a group of people engaging in various winter sports activities. The first scene shows a person skiing on a snowy hill, while the second scene features a group of people ice skating on an indoor rink. The third scene shows a person swimming in a pool. The video captures the excitement and thrill of winter sports, with the individuals showcasing their skills and enjoying the cold weather.", "gt-answer": "B. ice skating", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that people are skiing on ice.", "chatgpt-answer": "A. skiing", "video-llm-prediction": "People are seen skiing on ice.", "gt-answer": "B. ice skating", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that two people are ice skating in a gym.", "chatgpt-answer": "B. ice skating", "video-llm-prediction": "Two people are seen ice skating in a gym.", "gt-answer": "B. ice skating", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is shot in slow motion. Therefore, the tempo of the video is slow motion.", "chatgpt-answer": "B. slow motion", "video-llm-prediction": "The video shows two people sliding on an ice rink while wearing protective gear. They are seen gliding back and forth while holding onto a rope. The video is shot in slow motion, and the people are seen moving back and forth while holding onto the rope. The video ends with the people stopping and looking at each other.", "gt-answer": "B. slow motion", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention anything about the tempo or speed of the video. Therefore, we cannot determine the tempo based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases two men engaging in the sport of curling on an ice rink. They are seen pushing a puck along the ice, with one man wearing a white shirt and the other wearing a black shirt. The video captures the intense concentration and physical exertion required to play this sport. The sound of the puck gliding along the ice and the crunching of the ice underfoot can be heard in the background. The video also highlights the precision and teamwork required to play curling at a high level. Overall, the video provides a glimpse into", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the video is shot in slow motion.", "chatgpt-answer": "B. slow motion", "video-llm-prediction": "The video shows two people sliding on an ice rink while wearing protective gear. They are seen gliding back and forth while holding onto a rope. The video is shot in slow motion, and the sound of the ice sliding can be heard.", "gt-answer": "B. slow motion", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention any specific information about the tempo of the video. It only provides details about the sport of curling and the actions of the players. Without any indication of the tempo, it is not possible to determine the correct answer.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a group of people engaging in the sport of curling on an ice rink. The players are seen sliding down the ice while holding onto a curling stone, and they are dressed in appropriate attire for the sport. The video captures the players' movements and the sound of the ice being scraped. The video also shows the players taking a break and enjoying a drink. Overall, the video provides a glimpse into the sport of curling and the skills required to play it.", "gt-answer": "B. slow motion", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that some people are skating towards the camera, while others are skating parallel to the screen. Additionally, the video ends with the people skating away from the camera.", "chatgpt-answer": "C. away from the camera", "video-llm-prediction": "The video shows a group of people skating on an indoor rink. Some of them are skating towards the camera while others are skating parallel to the screen. The people are wearing different colored outfits and are skating at different speeds. The rink is well-lit, and there are no spectators visible in the video. The video ends with the people skating away from the camera.", "gt-answer": "A. towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the skaters are moving towards the camera, then parallel to the screen, and finally away from the camera.", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "The video showcases a group of people skating on an indoor rink. The camera captures the skaters as they move towards the camera, creating a sense of movement and excitement. The skaters continue to skate parallel to the screen, showcasing their skills and agility. The video ends with the skaters skating away from the camera, leaving the viewer with a sense of anticipation for what may come next.", "gt-answer": "A. towards the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the people are skating towards the camera.", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "People are seen skating towards the camera.", "gt-answer": "A. towards the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description states that two people are seen skating towards the camera while another two are skating parallel to the screen. Therefore, the correct answer is A. towards the camera.", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "Two people are seen skating towards the camera while another two are skating parallel to the screen.", "gt-answer": "A. towards the camera", "rating": 1 } ] }, "1073873933": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that the monkey is eating.", "chatgpt-answer": "A. eating", "video-llm-prediction": "A monkey is seen eating in the video.", "gt-answer": "B. fighting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that two monkeys are fighting while a third monkey is eating. This implies that the main action happening in the video is the monkeys fighting.", "chatgpt-answer": "B. fighting", "video-llm-prediction": "Two monkeys are seen fighting in the dirt, while a third monkey is seen eating.", "gt-answer": "B. fighting", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the monkey is eating in the video.", "chatgpt-answer": "A. eating", "video-llm-prediction": "A monkey is seen eating in the video.", "gt-answer": "B. fighting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that two monkeys are seen fighting on the ground, while another monkey is seen eating. This means that the main activity happening in the video is the monkeys fighting.", "chatgpt-answer": "B. fighting", "video-llm-prediction": "Two monkeys are seen fighting on the ground, while another monkey is seen eating.", "gt-answer": "B. fighting", "rating": 1 } ] }, "1089810425": { "action": [ { "chatgpt-reasoning": "The video description clearly mentions that a group of people are seen dancing in a pool.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of people are seen dancing in a pool while a man is seen cooking on a grill.", "gt-answer": "C. dancing", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the group of people are dancing in a pool, jumping up and down. They are seen splashing around in the water and the movements are described as energetic and free-flowing.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of people are seen dancing in a pool, with some of them jumping up and down. The video captures the joy and excitement of the moment as the people dance and splash around in the water. The sound of the splashing water and the upbeat music create a lively atmosphere, and the people's movements are energetic and free-flowing. The video showcases the fun and carefree nature of the moment, as the people let go of their inhibitions and enjoy themselves in the water. Overall, the video is a celebration of the joy and freedom of movement", "gt-answer": "C. dancing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a group of people are dancing in a pool, while cooking is happening in the background.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of people are dancing in a pool while a man is cooking in the background.", "gt-answer": "C. dancing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that a group of people are dancing in a pool, with some of them jumping up and down. This indicates that the people in the video are engaged in a dance activity.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of people are dancing in a pool, with some of them jumping up and down.", "gt-answer": "C. dancing", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the video is shot in slow motion.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video shows a group of people having fun in a pool. They are seen splashing water and dancing around. The video is shot in slow motion, and the people are seen enjoying themselves in the water.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the video is in slow motion.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video showcases a group of people having fun in a pool. They are seen splashing water and dancing around. The video is in slow motion, and the people are seen enjoying themselves in the water.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. We cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of people are seen playing in a pool and throwing water at each other.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that \"The video is in slow motion\".", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "A group of people are seen playing in a pool, with some of them jumping up and down. The video is in slow motion, and the people are having a great time.", "gt-answer": "B. normal speed", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description explicitly mentions that the camera pans from left to right, showing the entire scene.", "chatgpt-answer": "A. left to right", "video-llm-prediction": "The video shows a group of people having fun in a pool. They are seen splashing water and dancing around. The camera pans from left to right, showing the entire scene.", "gt-answer": "B. right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the camera pans from left to right, capturing the lively atmosphere of the pool party.", "chatgpt-answer": "A. left to right", "video-llm-prediction": "The video shows a group of people having fun in a pool. They are seen splashing water and dancing around. The camera pans from left to right, capturing the lively atmosphere of the pool party.", "gt-answer": "B. right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a group of people are seen playing in a pool, throwing water at each other and having a good time. The panning direction is not mentioned in the video description, so we cannot determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of people are seen playing in a pool, throwing water at each other and having a good time.", "gt-answer": "B. right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a group of people are seen in a pool, indicating that there is some movement happening in the video. Since the description does not provide specific information about the direction of panning, we cannot determine the exact answer without visual cues from the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of people are seen in a pool, throwing water at each other while dancing.", "gt-answer": "B. right to left", "rating": 0 } ] }, "1077507593": { "action": [ { "chatgpt-reasoning": "The video description clearly states that a chef is seen cooking in a pan on a stove. The actions described, such as adding oil, stirring, and adding liquid, are all associated with the process of cooking.", "chatgpt-answer": "D. cooking", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. The chef adds oil to the pan and stirs it. The chef then adds a liquid to the pan and stirs it again. The chef then adds more liquid to the pan and stirs it once more. The chef then adds more liquid to the pan and stirs it again. The chef then adds more liquid to the pan and stirs it one last time. The chef then takes the pan off the stove and sets it down.", "gt-answer": "D. cooking", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that a chef is cooking in a pan on a stove. It describes the actions of adding oil, stirring, and adding liquid repeatedly.", "chatgpt-answer": "D. cooking", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. The chef adds oil to the pan and stirs it before adding a liquid to the pan. The chef then adds more oil to the pan and stirs it again. The chef continues to stir the pan and adds more liquid to it. The chef then adds more oil to the pan and stirs it again. The chef then adds more liquid to the pan and stirs it again. The chef then adds more oil to the pan and stirs it again. The chef then adds more liquid to the pan and stirs it again. The chef then adds more oil", "gt-answer": "D. cooking", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that a chef is cooking food in the pan on a stove.", "chatgpt-answer": "D. cooking", "video-llm-prediction": "A chef cooks food in a pan on a stove.", "gt-answer": "D. cooking", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that a chef is seen cooking in a pan on a stove. The chef adds oil, seasoning, liquid, and flame to the pan while stirring it. This indicates that the people in the video are cooking.", "chatgpt-answer": "D. cooking", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. The chef adds oil to the pan and stirs it before adding seasoning to the pan. The chef then adds a liquid to the pan and stirs it. The chef continues to stir the pan and adds more liquid to it. The chef then adds a flame to the pan and stirs it. The chef then adds more liquid to the pan and stirs it. The chef then adds more flame to the pan and stirs it. The chef then adds more liquid to the pan and stirs it. The chef then adds more flame to the", "gt-answer": "D. cooking", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description does not mention any specific speed-related information. Therefore, it is not possible to determine the speed of the video based on the given description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. He adds oil to the pan and stirs it around. He then adds a liquid to the pan and stirs it around. The chef then adds more oil to the pan and stirs it around. The chef then adds more liquid to the pan and stirs it around. The chef then adds more oil to the pan and stirs it around. The chef then adds more liquid to the pan and stirs it around. The chef then adds more oil to the pan and stirs it around. The chef then adds more liquid to the pan and stirs it", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the actions performed by the chef while cooking. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. He adds oil to the pan and stirs it before adding a liquid to the pan. The chef then adds a spoonful of flour to the pan and stirs it. The chef then adds a spoonful of water to the pan and stirs it. The chef then adds a spoonful of sauce to the pan and stirs it. The chef then adds a spoonful of butter to the pan and stirs it. The chef then adds a spoonful of salt to the pan and stirs it. The chef then", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. There is no information provided to determine if the video is in normal speed, slow motion, or time-lapse.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. The chef adds oil to the pan and stirs the food. The chef then adds more oil to the pan and stirs the food again. The chef continues to stir the food in the pan.", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any abnormalities or changes in speed, suggesting that the video is running at normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. He adds oil to the pan and stirs the food. The flames rise as he continues to cook.", "gt-answer": "B. slow motion", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description mentions that the chef adds oil to the pan and stirs it. This implies that the skillet is being heated on the stove, but there is no mention of burning in fire or smoking.", "chatgpt-answer": "B. None of both", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. The chef adds oil to the pan and stirs it. The chef then adds a liquid to the pan and stirs it. The chef then adds a spoon to the pan and stirs it. The chef then adds a liquid to the pan and stirs it. The chef then adds a spoon to the pan and stirs it. The chef then adds a liquid to the pan and stirs it. The chef then adds a spoon to the pan and stirs it. The chef then adds a liquid to the pan and stirs it. The", "gt-answer": "C. Smoking", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef adds oil to the pan and stirs it before adding a liquid to the pan. This indicates that the chef starts by heating the pan and adding oil, which would result in smoking before any burning or other events occur.", "chatgpt-answer": "C. Smoking", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. He adds oil to the pan and stirs it before adding a liquid to the pan. The chef then adds a spoonful of flour to the pan and stirs it. The chef then adds a spoonful of liquid to the pan and stirs it. The chef then adds a spoonful of flour to the pan and stirs it. The chef then adds a spoonful of liquid to the pan and stirs it. The chef then adds a spoonful of flour to the pan and stirs it. The chef then", "gt-answer": "C. Smoking", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the pan is smoking first, and then it starts burning in fire. Therefore, the event of smoking happens first.", "chatgpt-answer": "C. Smoking", "video-llm-prediction": "A chef is seen cooking in a pan on the stove. The pan is smoking, and then it starts burning in fire.", "gt-answer": "C. Smoking", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, the chef adds oil to the pan and stirs it first. There is no mention of the skillet burning in fire or smoking in the video description.", "chatgpt-answer": "B. None of both", "video-llm-prediction": "A chef is seen cooking in a pan on a stove. The chef adds oil to the pan and stirs it. The chef then adds a liquid to the pan and stirs it again. The chef then adds a solid to the pan and stirs it. The chef then adds a liquid to the pan and stirs it again. The chef then adds a solid to the pan and stirs it again. The chef then adds a liquid to the pan and stirs it again. The chef then adds a solid to the pan and stirs it again. The chef then adds a liquid to the pan and stirs it", "gt-answer": "C. Smoking", "rating": 0 } ] }, "1107116885": { "action": [ { "chatgpt-reasoning": "The video description states that the man is seen swimming in a pool, shooting an arrow with a bow and arrow, and running in a field. Therefore, the correct answer is C. running, as it encompasses all three activities mentioned in the video description.", "chatgpt-answer": "C. running", "video-llm-prediction": "A man is seen swimming in a pool, then he is shown shooting an arrow with a bow and arrow. Finally, he is seen running in a field.", "gt-answer": "B. shooting an arrow", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is seen swimming in the water, then shooting an arrow with a bow and arrow, and finally running in the field. Therefore, the man is engaged in multiple activities - swimming, shooting an arrow, and running.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen swimming in the water, then he is shown shooting an arrow with a bow and arrow. Finally, he is seen running in the field.", "gt-answer": "B. shooting an arrow", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is swimming in the water while holding a bow and arrow. He then shoots an arrow at a target and runs away. This indicates that the main activity he is engaged in is shooting an arrow.", "chatgpt-answer": "B. shooting an arrow", "video-llm-prediction": "A man is seen swimming in the water while holding a bow and arrow. He then shoots an arrow at a target and runs away.", "gt-answer": "B. shooting an arrow", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is shooting an arrow in a field while holding a bow and arrow in his hand. This indicates that the man is engaged in the activity of shooting an arrow.", "chatgpt-answer": "B. shooting an arrow", "video-llm-prediction": "A man is seen shooting an arrow in a field while wearing a black shirt and a grey vest. He is holding a bow and arrow in his hand and is standing in a field.", "gt-answer": "B. shooting an arrow", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is shot in time-lapse mode, which means it is played at a faster speed than real-time.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "The video shows a man wearing a black hat and a black shirt, who is holding a bow and arrow. He is seen aiming the bow and arrow at a target in the distance. The man then releases the arrow, and it hits the target. The video is shot in a field with trees in the background. The man is wearing a grey vest and has a watch on his left hand. The video is shot in time-lapse mode, and the man is seen shooting the arrow multiple times. The video is shot in slow motion, and the man is seen aiming the bow and arrow at the target. The", "gt-answer": "D. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the pace of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man wearing a black hat and a black shirt, who is holding a bow and arrow. He is seen aiming at a target in the distance and then releasing the arrow. The man then pulls back the arrow and aims at another target. The video captures the man's precision and skill in archery.", "gt-answer": "D. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any specific speed manipulation or alteration. It simply describes the man holding a bow and arrow, aiming at a target, and releasing the arrow. Therefore, we can infer that the pace of the video is normal speed.", "chatgpt-answer": "D. normal speed", "video-llm-prediction": "A man is seen holding a bow and arrow, aiming it at a target, and then releasing the arrow.", "gt-answer": "D. normal speed", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention any specific alteration to the speed of the video. It describes a man shooting a bow and arrow in a field, taking aim, and shooting the arrow towards the target. Since there is no indication of time manipulation, it can be inferred that the video is at normal speed.", "chatgpt-answer": "D. normal speed", "video-llm-prediction": "A man is seen shooting a bow and arrow in a field. He takes aim and shoots the arrow towards the target.", "gt-answer": "D. normal speed", "rating": 1 } ] }, "1059718130": { "speed": [ { "chatgpt-reasoning": "Based on the description, there is no mention of any alteration or manipulation of the video speed. It simply describes a beautiful sunset with a large orange sun setting behind a cloudy sky. Therefore, we can assume that the video is shown at normal speed.", "chatgpt-answer": "B. normal speed", "video-llm-prediction": "The video showcases a beautiful sunset with a large orange sun setting behind a cloudy sky. The sun is seen rising and setting behind the clouds, creating a mesmerizing view. The video also features a large orange sun setting behind a cloudy sky, which is consistent with the video.", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the video has a \"slow-motion effect.\"", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video showcases a beautiful sunset with a large orange sun setting behind a cloudy sky. The sun's rays shine through the clouds, creating a stunning display of colors. The video captures the serene beauty of the sunset, with the sun's rays illuminating the sky and casting a warm glow on the clouds. The video's slow-motion effect allows the viewer to appreciate the intricate details of the sunset, from the delicate wisps of cloud to the vibrant hues of the sky. Overall, the video is a captivating", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of a sunset with a cloudy sky and a bright orange sun.", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. We cannot determine the speed based on the description alone.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a beautiful sunset with a large orange sun setting behind a cloudy sky. The sun is seen setting behind the clouds, and the sky is filled with orange and red hues. The video captures the serene beauty of the sunset, with the sun setting behind the clouds, creating a stunning visual display.", "gt-answer": "C. time-lapse", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description clearly states that the sun is setting in the sky, implying that it is moving from one side to another.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The video showcases the sun setting in the sky, with the sun appearing to move from the left to the right side of the frame. The sun is seen in different positions, including in the middle of the frame and on the left side. The video also features a cloudy sky with the sun shining through the clouds. The video captures the beauty of the sunset and the changing colors of the sky.", "gt-answer": "B. rising", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sun is seen in different positions, from rising to setting and staying in one place. This implies that the sun is moving either in the setting direction or the rising direction.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The video shows a beautiful sunset with the sun setting in the sky. The sun is seen in different positions, from rising to setting and staying in one place. The sky is filled with clouds, and the sun is seen through them. The video captures the beauty of nature and the peacefulness of the moment.", "gt-answer": "B. rising", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the sun is seen setting in the sky. This implies that the sun is moving in the setting direction.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The sun is seen setting in the sky, with clouds moving around it.", "gt-answer": "B. rising", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the sun sets in the sky. This indicates that the sun is moving in the direction of setting.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The sun sets in the sky, and the clouds move around it.", "gt-answer": "B. rising", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that \"The sky gradually gets darker as the sun sets\". This implies that the video's brightness is getting darker.", "chatgpt-answer": "A. getting darker", "video-llm-prediction": "The video showcases a beautiful sunset with the sun setting behind a cloudy sky. The sky gradually gets darker as the sun sets, but the clouds remain the same. The video captures the serene beauty of the sunset and the tranquility of the sky.", "gt-answer": "C. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the brightness of the video. Therefore, we cannot determine what is happening to the video's brightness based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video captures the sunset, with the sun setting behind the clouds. The sky is orange, and the clouds are white. The sun is seen setting behind the clouds, and the sky is orange. The clouds are white, and the sun is seen setting behind them. The video showcases the beauty of the sunset, with the sun setting behind the clouds, and the sky is orange. The clouds are white, and the sun is seen setting behind them. The video is a visual representation of the sunset, with the sun setting behind the clouds, and the sky is orange. The clouds are white, and the sun", "gt-answer": "C. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"The sky is getting darker as the sun sets.\" This implies that the brightness of the video is also getting darker.", "chatgpt-answer": "A. getting darker", "video-llm-prediction": "The video shows a beautiful sunset with the sun setting behind the clouds. The sky is getting darker as the sun sets.", "gt-answer": "C. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun is setting and the clouds are getting darker. This implies that the overall brightness of the video is decreasing.", "chatgpt-answer": "A. getting darker", "video-llm-prediction": "The sun is setting in the sky, and the clouds are getting darker.", "gt-answer": "C. turning brighter", "rating": 0 } ] }, "1083845854": { "speed": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that the video shows the clock with the hands moving around the face and then showing the time. This indicates that the video is playing at normal speed, as it is showing the passage of time in a regular manner.", "chatgpt-answer": "C. normal speed", "video-llm-prediction": "The video shows a close-up of a clock with the hands moving around the face. The video then shows the same clock from different angles. The video ends with the clock showing the time.", "gt-answer": "A. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video transitions to a time-lapse of the clock, showing the hands moving quickly. It then slows down the time-lapse to show the hands moving in slow motion. Finally, the video returns to a normal speed. Therefore, the correct answer is C. normal speed.", "chatgpt-answer": "C. normal speed", "video-llm-prediction": "The video showcases a close-up of a clock, with the camera zooming in on the time and the hands moving around. The video then transitions to a time-lapse of the same clock, with the hands moving quickly around the clock. The video then slows down the time-lapse to show the hands moving around the clock in slow motion. Finally, the video returns to a normal speed, showing the hands moving around the clock.", "gt-answer": "A. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the video is in time-lapse mode and the second hand moves quickly around the clock. This indicates that the video is playing at a faster speed than normal.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "The video shows a close-up of a clock with a red second hand moving around the clock. The video is in time-lapse mode, and the second hand moves quickly around the clock.", "gt-answer": "A. time-lapse", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that there is a time-lapse of the second hand moving around the clock face. This indicates that the video is playing at a faster speed than normal.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "The video showcases a close-up of a clock with a red second hand moving around the clock face. The video also includes a time-lapse of the second hand moving around the clock face.", "gt-answer": "A. time-lapse", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description states that the clock hands are moving in a clockwise direction, but the video itself shows the hands moving in a counterclockwise direction.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video shows a clock with the hands moving in a counterclockwise direction. The video also includes a piece of information that states the hands are moving in a clockwise direction. However, the video itself clearly shows the hands moving in a counterclockwise direction.", "gt-answer": "B. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the clock's hands start by moving in a counterclockwise direction, then move in a stationary position, and finally end with the hands moving in a clockwise direction.", "chatgpt-answer": "B. clockwise", "video-llm-prediction": "The video showcases a close-up of a clock with its hands moving in a counterclockwise direction. The clock's hands move in a stationary position, and the video ends with the hands moving in a clockwise direction.", "gt-answer": "B. clockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that there is a clock with a red second hand. Based on our understanding of clocks, the second hand always moves in a clockwise direction.", "chatgpt-answer": "B. clockwise", "video-llm-prediction": "A clock with a red second hand is shown in the video.", "gt-answer": "B. clockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the clock hands are moving in a counterclockwise direction.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video shows a close-up of a clock with its hands moving in a counterclockwise direction.", "gt-answer": "B. clockwise", "rating": 0 } ] }, "1050618460": { "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only mentions the various stages of bloom and the overall serene experience. Therefore, it is not possible to determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a beautiful white flower blooming in a blue sky. The flower is shown in various stages of bloom, from a bud to a fully bloomed flower. The video also includes a close-up shot of the flower, highlighting its delicate petals and intricate details. The video provides a serene and calming experience, with the sound of the wind and the gentle rustling of the petals. Overall, the video is a beautiful and peaceful representation of the beauty of nature.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the visuals and the focus on the flower. There are no clues or hints to suggest that the video is in a specific speed such as normal speed, time-lapse, or slow motion.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a beautiful white flower with a yellow center, surrounded by green leaves. The flower is shown in various positions, including close-ups of the petals and the center. The video also includes a shot of a blue sky with a few white clouds. The flower is the main focus of the video, and it is shown in different positions and angles, highlighting its beauty and delicate nature. The video is a visual treat for anyone who appreciates the beauty of nature.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video is showcasing the beauty of flowers in bloom. This description does not provide any information about the speed of the video. We cannot determine the speed of the video based on the given video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video showcasing the beauty of flowers in bloom.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. Therefore, it is not possible to determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video showcasing the beauty of flowers in bloom.", "gt-answer": "B. time-lapse", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description states that the flower bud turns into a full bloom, then withers and wilts, and finally remains as a bud. This implies that the flowers are undergoing a transformation from bud to full bloom and then back to bud.", "chatgpt-answer": "D. remaining as buds", "video-llm-prediction": "The video showcases the process of a flower bud turning into a full bloom. The video starts with a close-up shot of a flower bud, which then transitions to a full bloom flower. The video then shows the flower withering and wilting, and finally, it remains as a bud. The video highlights the beauty of the flower and the process of its transformation.", "gt-answer": "C. turning into full bloom", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the flower bud transitions into a full bloom, then withers and wilts, and finally remains as buds. Therefore, the correct answer is D. remaining as buds.", "chatgpt-answer": "D. remaining as buds", "video-llm-prediction": "The video showcases the process of a flower bud turning into a full bloom. The video starts with a close-up of a flower bud, which then transitions to a full bloom. The video then shows the flower bud withering and wilting, which is followed by the bud turning into a full bloom. The video ends with the flower bud remaining as buds.", "gt-answer": "C. turning into full bloom", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the flower bud is turning into a full bloom, which means the flowers are going through the process of blooming and opening up.", "chatgpt-answer": "C. turning into full bloom", "video-llm-prediction": "The video shows the process of a flower bud turning into a full bloom.", "gt-answer": "C. turning into full bloom", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the flowers are going through the process of blooming, from buds to full bloom, and then withering and wilting. This means that the flowers are going through a cycle where they start as buds, turn into full bloom, and eventually wither.", "chatgpt-answer": "D. remaining as buds", "video-llm-prediction": "A video showcases the process of flowers blooming, from buds to full bloom, and then withering and wilting.", "gt-answer": "C. turning into full bloom", "rating": 0 } ] }, "1083113449": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the video is shot in slow motion.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video showcases a tall building with many windows at night. The camera pans around the building, and the lights inside the building are on. The video is shot in slow motion, and the lights inside the building are on.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the visual aspects of the building and the camera movement. Therefore, there is no way to determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a tall building with many windows at night. The camera pans around the building, and the lights inside the building are on. The video captures the beauty of the building at night, with the lights shining brightly against the dark sky. The camera movement is smooth and steady, providing a clear view of the building's exterior. The video is shot in a way that highlights the building's architectural features, such as the windows and the facade. Overall, the video is a captivating visual experience that showcases the building's beauty at night.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. Therefore, it is not possible to determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of a tall building at night with a green light on the top. The building is lit up with many windows and a green light on the top.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. We cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a tall building with many windows at night. The camera pans around the building, and the lights inside the building are on. The video captures the beauty of the building at night.", "gt-answer": "B. time-lapse", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the sky is seen getting darker. This means that the brightness of the sky is decreasing.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The video shows a building at night with its lights on. The sky is seen getting darker, and the building's lights are still on.", "gt-answer": "C. getting darker", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the building is located in a city at night, and the camera pans around the building. This implies that the scene is set during nighttime. Therefore, the sky's appearance would be \"getting darker\" as the video progresses.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The video showcases a tall building with a blue tinted glass exterior, illuminated by a blue light from the inside. The building is located in a city at night, and the camera pans around the building, capturing its unique architectural features. The video also includes a shot of a person walking in front of the building, adding a sense of scale and human presence to the scene.", "gt-answer": "C. getting darker", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the sky is getting darker, indicating a change in brightness.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The sky is getting darker.", "gt-answer": "C. getting darker", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the sky is getting darker, indicating a change in its appearance.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The sky is getting darker, but it is still bright.", "gt-answer": "C. getting darker", "rating": 1 } ] }, "1091143117": { "speed": [ { "chatgpt-reasoning": "The video description explicitly mentions that there is a time-lapse sequence in the video, highlighting the natural movements of the eye.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "The video begins with a close-up shot of a person's eye, showcasing the intricate details of the eyelashes and eyebrow. The camera then pans out to reveal the entire eye, capturing the vibrant colors and textures of the iris and surrounding tissue. The video then transitions to a time-lapse sequence, highlighting the natural movements of the eye as it blinks and shifts in focus. The camera captures the eye's dynamic nature, showcasing the fluidity of the eyelids and the movement of the ey", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the video includes a time-lapse effect, which allows the viewer to observe the eye's movement over time.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "The video showcases a close-up of a person's eye, with a focus on the iris and the surrounding area. The camera captures the eye's movement as it blinks, and the viewer can see the intricate details of the iris. The video also includes a time-lapse effect, which allows the viewer to observe the eye's movement over time. The video provides a detailed and intimate look at the eye, highlighting its beauty and complexity.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the close-up of a person's eye with a focus on the blue color. Therefore, it is not possible to determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a close-up of a person's eye, with a focus on the blue color of the eye.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The description of the video does not provide any information about the speed of the video. It only describes the content and focus of the video, which is about a person's eye and the process of inserting a contact lens. Therefore, it is not possible to determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a close-up of a person's eye, with a focus on the eye's blue color. The video also features a person's hand holding a contact lens, which is inserted into the eye. The video emphasizes the importance of eye care and hygiene.", "gt-answer": "C. normal speed", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the person's eye is initially closed, then opens, and finally closes again. This indicates a change in the state of the eye from closed to open and back to closed.", "chatgpt-answer": "A. from closed to open", "video-llm-prediction": "The video shows a close-up of a person's eye, which is initially closed. The person then opens their eye, and the camera zooms in to show the details of the eye. The video ends with the person closing their eye again.", "gt-answer": "A. from closed to open", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the eye is initially closed and then opens to reveal its contents. It also states that the entire eye is blurry and appears to be turning red. This indicates that the eye is going through multiple changes, including opening, becoming blurry, and turning red.", "chatgpt-answer": "A. from closed to open", "video-llm-prediction": "The video showcases a close-up of an eye, which is initially closed and then opens to reveal its contents. The camera then pans out to show the entire eye, which is blurry and appears to be turning red.", "gt-answer": "A. from closed to open", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the eye is turning red.", "chatgpt-answer": "B. turning red", "video-llm-prediction": "A close-up of an eye is shown, and it is revealed that the eye is turning red.", "gt-answer": "A. from closed to open", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the eye is shown from different angles, both from the inside and outside. It also mentions that the video shows a close-up perspective of the eye. None of the choices can be inferred from this information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person's eye is shown in the video, and it is seen from different angles. The eye is shown from the inside, and it is also shown from the outside. The video also shows the eye from a close-up perspective.", "gt-answer": "A. from closed to open", "rating": 0 } ] }, "1100329207": { "action": [ { "chatgpt-reasoning": "The video description mentions that the sheep are seen running around and eating grass. It also states that the video shows the sheep sleeping in the field.", "chatgpt-answer": "A. running, C. eating grass", "video-llm-prediction": "The video shows a large herd of sheep grazing in a field. The sheep are seen running around and eating grass. The video also shows the sheep sleeping in the field.", "gt-answer": "A. running", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sheep are seen running, sleeping, and eating grass in the field.", "chatgpt-answer": "A. running, B. sleeping, C. eating grass", "video-llm-prediction": "The video showcases a large herd of sheep grazing in a vast field. The sheep are seen running and sleeping in the field, and they are also seen eating grass. The video captures the peaceful and serene environment of the field, with the sheep grazing and enjoying the natural surroundings. The video provides a glimpse into the daily life of the sheep and their natural behavior in a peaceful environment.", "gt-answer": "A. running", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sheep are seen running, sleeping, and eating grass in the same field. Therefore, the correct answer is C. eating grass.", "chatgpt-answer": "C. eating grass", "video-llm-prediction": "A herd of sheep is seen running in a field, then they are seen sleeping. Later, they are seen eating grass in the same field.", "gt-answer": "A. running", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the herd of sheep is grazing in a field, which implies that they are eating grass.", "chatgpt-answer": "C. eating grass", "video-llm-prediction": "A herd of sheep is seen grazing in a field.", "gt-answer": "A. running", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that the sheep are seen walking around in the field. Since we know that the sheep are the focus of the video and they are moving around, it is likely that the camera is also moving to follow the sheep.", "chatgpt-answer": "D. moving forward", "video-llm-prediction": "The video shows a large herd of sheep grazing in a field. The sheep are seen walking around and grazing on the grass. The video also shows a man herding the sheep with a dog. The sheep are seen walking around in the field, and the man is seen herding them with the dog. The video captures the peaceful and serene atmosphere of the countryside, with the sound of the wind and the occasional bleating of the sheep. The video is a beautiful representation of the simple life of a farmer and the beauty of nature.", "gt-answer": "D. moving forward", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, it is mentioned that the camera captures the sheep as they move around the field. Since the description does not specify any specific movement or direction other than the camera capturing the movements of the sheep, it is not possible to determine the exact direction of the camera view.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a large herd of sheep grazing in a vast field. The camera captures the sheep as they move around the field, with some walking closer to the camera and others further away. The sheep are seen grazing on the grass, and the camera captures their movements as they continue to graze. The video provides a peaceful and serene view of the countryside, with the sound of the wind and the occasional bleat of the sheep adding to the tranquility. Overall, the video is a beautiful depiction of the natural world and the simple beauty of the countrys", "gt-answer": "D. moving forward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a herd of sheep is seen grazing in a field. It doesn't provide any information about the movement of the camera view.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A herd of sheep is seen grazing in a field.", "gt-answer": "D. moving forward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the field, indicating a movement of the camera. It does not specify the direction of the camera movement explicitly.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A herd of sheep is seen grazing in a field. The camera pans around the field, showing the sheep in different positions. The sky is blue and clear, and the field is green and lush. The sheep are seen grazing on the grass, and some are lying down. The camera captures the peacefulness of the scene, with the sound of the wind and the occasional bleat of the sheep.", "gt-answer": "D. moving forward", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description does not mention anything specific about the speed of the video. It only provides information about the content and atmosphere of the video, but no details regarding its speed.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a large herd of sheep grazing in a field. The sheep are seen walking around and grazing on the grass. The video also shows the sheep walking around in the field. The video is shot in a serene and peaceful environment with a beautiful view of the mountains in the background. The video is shot in a way that captures the beauty of the landscape and the peacefulness of the animals. The video is a perfect representation of the beauty of nature and the peacefulness of the animals.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The description of the video does not mention anything about the speed of the video. It only describes the actions and behavior of the sheep in the field. Therefore, there is no information provided to determine the speed of the video.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a large herd of sheep grazing in a vast, open field. The camera captures the serene landscape, with the sheep scattered throughout the field, grazing peacefully. The camera then focuses on a specific sheep, highlighting its grazing behavior. The video then transitions to a panoramic view of the entire field, showcasing the vastness of the landscape and the peacefulness of the scene. The camera then zooms in on the sheep, providing a close-up view of their grazing behavior. The video then transitions to a panoramic view of", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed based on the provided information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A large herd of sheep is seen grazing in a field.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the actions and movements of the sheep. Therefore, it is not possible to determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A large herd of sheep is seen grazing in a field. The camera pans around the field, showing the sheep in various positions. The video ends with the sheep walking away.", "gt-answer": "B. normal speed", "rating": 0 } ] }, "1089201973": { "action": [ { "chatgpt-reasoning": "The video description mentions that the people are playing football on a field, running around, passing the ball, and attempting to score goals. This implies that they are actively involved in kicking the football.", "chatgpt-answer": "B. kicking football", "video-llm-prediction": "The video showcases a group of people playing football on a field. The players are seen spinning, throwing, and kicking the ball around. The video captures the players' movements and actions as they play the game. The players are seen running around the field, passing the ball to each other, and attempting to score goals. The video also shows the players' teamwork and coordination as they work together to play the game. Overall, the video provides a glimpse into the exciting and dynamic world of football.", "gt-answer": "B. kicking football", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the players are seen spinning, throwing, and stopping the football, while kicking it around. This indicates that the people in the video are engaging in multiple activities involving the football.", "chatgpt-answer": "A. stopping football, B. kicking football, C. throwing football", "video-llm-prediction": "The video showcases a group of people playing football on a field. The players are seen spinning, throwing, and stopping the football, while kicking it around. The video captures the players' movements and the ball's trajectory, highlighting the excitement and energy of the game.", "gt-answer": "B. kicking football", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is spinning a football on the ground, throwing it, and there are several people kicking the football. One person is also mentioned to be stopping it. These actions imply that the people in the video are both kicking and stopping the football.", "chatgpt-answer": "B. kicking football", "video-llm-prediction": "A person is seen spinning a football on the ground, and then throwing it. The video shows several people kicking the football, and one person stopping it.", "gt-answer": "B. kicking football", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that one person is spinning a football, another person is throwing it, another person is kicking it, and another person is stopping it.", "chatgpt-answer": "A. stopping football, B. kicking football, C. throwing football, D. spinning football", "video-llm-prediction": "A person is seen spinning a football in the air, and then throws it. Another person is seen kicking the football, and another person is seen stopping the football.", "gt-answer": "B. kicking football", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "From the description, there is no indication that the video is in time-lapse or slow motion. The actions described are happening in a continuous and realistic manner, suggesting that the video is at normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "A soccer player kicks the ball towards the goal, and the goalkeeper attempts to block it. The ball hits the ground and bounces away from the goal. The player then kicks the ball again, and the goalkeeper tries to block it again. The ball hits the ground and bounces away from the goal. The player kicks the ball again, and the goalkeeper tries to block it again. The ball hits the ground and bounces away from the goal. The player kicks the ball again, and the goalkeeper tries to block it again. The ball hits the ground and bounces away", "gt-answer": "C. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any alteration or acceleration of the video speed. It simply describes the actions and movements in the video without any indication of a change in speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "A player kicks a soccer ball on a field, and the ball flies through the air. The player's foot is shown in close-up, and the ball is seen in motion. The video ends with the player's foot kicking the ball.", "gt-answer": "C. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a soccer player kicks the ball on a field and the ball flies through the air. This implies that the actions in the video are happening in real-time, at a regular speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "A soccer player kicks the ball on a field, and the ball flies through the air.", "gt-answer": "C. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that \"The player's feet are shown in slow motion, and the ball is kicked with great force.\" This indicates that the video is in slow motion.", "chatgpt-answer": "C. slow motion", "video-llm-prediction": "A player kicks a soccer ball on a field, and the ball flies through the air. The player's feet are shown in slow motion, and the ball is kicked with great force. The player's movements are fluid and graceful, and the ball is kicked with precision. The field is surrounded by a lush green landscape, and the sun is shining brightly in the sky. The player's form is excellent, and the ball is kicked with great power. The player's movements are fluid and graceful, and the ball is kicked with precision. The player's form", "gt-answer": "C. slow motion", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that the person kicks the ball from the right side of the field towards the left side. This indicates that the ball is moving from right to left.", "chatgpt-answer": "B. moving from right to left", "video-llm-prediction": "A person is seen kicking a soccer ball on a field. The ball is kicked from the right side of the field towards the left side. The person kicks the ball with their right foot and the ball flies through the air. The person kicks the ball again and it flies through the air. The person kicks the ball again and it flies through the air. The person kicks the ball again and it flies through the air. The person kicks the ball again and it flies through the air. The person kicks the ball again and it flies through the air. The person k", "gt-answer": "A. moving from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the ball is flying towards the goal. Since the goal is typically located on one side of the field, we can infer that the ball is moving either from left to right or from right to left.", "chatgpt-answer": "A. moving from left to right", "video-llm-prediction": "A player kicks a football on a field, and the ball flies towards the goal. The player's foot is shown in close-up, and the ball is seen flying through the air. The player's foot is shown again, and the ball is seen flying towards the goal. The player's foot is shown again, and the ball is seen flying towards the goal. The player's foot is shown again, and the ball is seen flying towards the goal. The player's foot is shown again, and the ball is seen flying towards the goal. The player's foot is shown again, and the", "gt-answer": "A. moving from left to right", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the soccer player \"kicks\" the ball, which implies that the ball is being propelled in a certain direction. It does not mention any stationary position of the ball. Therefore, we can infer that the ball is moving.", "chatgpt-answer": "A. moving from left to right", "video-llm-prediction": "A soccer player kicks the ball on a field.", "gt-answer": "A. moving from left to right", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ball is seen in the air multiple times. This indicates that the ball is moving.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A soccer player kicks a ball on a field, and the ball is seen in the air. The player's feet are shown in the air, and the ball is seen in the air. The player's feet are shown in the air, and the ball is seen in the air. The player's feet are shown in the air, and the ball is seen in the air. The player's feet are shown in the air, and the ball is seen in the air. The player's feet are shown in the air, and the ball is seen in the air. The player's feet are shown", "gt-answer": "A. moving from left to right", "rating": 0 } ] }, "1034736653": { "action": [ { "chatgpt-reasoning": "The video description clearly indicates that the women are running on a track, so the correct answer is C. running.", "chatgpt-answer": "C. running", "video-llm-prediction": "The video shows a group of women running on a track, with one woman leading the pack. The other women are seen running behind her. The video also shows a woman in a blue shirt running on the track. The video captures the energy and athleticism of the women as they run and exercise.", "gt-answer": "C. running", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the women are participating in a track and field event, running down the track and jumping into a pit.", "chatgpt-answer": "C. running", "video-llm-prediction": "The video showcases a group of women who are participating in a track and field event. The women are seen running down the track and jumping into a pit. The video captures the athleticism and grace of the women as they compete in the event. The women are dressed in athletic attire and are seen running with determination and focus. The video also highlights the precision and skill required to successfully complete the event. Overall, the video is a testament to the strength, agility, and athleticism of the women participating in the track and field event.", "gt-answer": "C. running", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the woman athletes are running. Neither cycling, swimming, nor dancing can be inferred from the given information.", "chatgpt-answer": "C. running", "video-llm-prediction": "A woman is seen running on a track while another woman is seen running on a field.", "gt-answer": "C. running", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the women athletes are running down a track and one of them jumping into a pile of sand, which indicates that they are participating in a running event.", "chatgpt-answer": "C. running", "video-llm-prediction": "The video showcases a group of women who are all athletes. They are seen running down a track, with one of them jumping into a pile of sand. The video captures the athletes in action, showcasing their skills and athleticism.", "gt-answer": "C. running", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the woman is running at a normal speed. There is no mention of her running faster or slower than normal.", "chatgpt-answer": "A. Normal speed", "video-llm-prediction": "The video shows a woman running on a track, and she is the only one running. She is wearing a pink shirt and black shorts. The woman is running at a normal speed, and she is the only one running. The video is shot from a distance, and the woman is running alone.", "gt-answer": "C. The fastest speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is running at a normal speed. It specifically states that \"she is running at a normal speed\".", "chatgpt-answer": "A. Normal speed", "video-llm-prediction": "The video shows a woman running on a track, and she is the only one who is running. She is wearing a pink shirt and blue shorts. The woman is running at a normal speed, and she is the only one who is running. The video is shot from a distance, and the woman is the only one who is running.", "gt-answer": "C. The fastest speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman runs on a track and jumps into a pile of sand. This suggests that the woman is performing a high-speed activity, as running and jumping generally require a certain level of speed and momentum. Therefore, the answer would be C. The fastest speed, as the woman is likely running at a fast pace in order to perform the jump.", "chatgpt-answer": "C. The fastest speed", "video-llm-prediction": "A woman runs on a track and jumps into a pile of sand.", "gt-answer": "C. The fastest speed", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is running at different speeds, including normal, slow, and fast speeds. It also states that the camera captures her from different angles. Since the question asks for the speed of the woman closest to the camera, we can assume that the camera captures the woman at multiple points in the video. Therefore, based on the information provided, the correct answer would be:", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a woman running on a track, and the camera captures her from different angles. The woman is seen running at different speeds, including normal, slow, and fast speeds. The video also shows the woman running on a track with other people.", "gt-answer": "C. The fastest speed", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description clearly states that the women are initially running from right to left, and then they start running in circles.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "The video shows a group of women running on a track. They are seen running from right to left, and then they start running in circles. The video captures the athleticism and endurance of the women as they push themselves to their limits. The sound of their footsteps and the cheers of the crowd add to the excitement of the moment. The video is a testament to the power of physical activity and the importance of staying active.", "gt-answer": "C. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the women are seen running from right to left initially, and then they turn around and run in circles.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "The video shows a group of women running on a track. They are seen running from right to left, and then they turn around and run in circles. The video captures the athleticism and endurance of these women as they push themselves to their limits. The sound of their footsteps and the cheers of the crowd can be heard in the background, adding to the excitement of the moment. Overall, the video is a testament to the power of physical activity and the importance of staying active.", "gt-answer": "C. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the women are passing each other and continuing to run. This indicates that they are running in opposite directions. Since it doesn't mention about circular motion, option B can be eliminated. The specific direction is not mentioned (e.g., clockwise or counterclockwise), so we can assume it's a simple back and forth motion on a track. Therefore, the correct answer is A. from right to left.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "A group of women run on a track, passing each other and continuing to run.", "gt-answer": "C. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the group of women are running in circles. This means that they are continuously moving in a circular path, without any mentioned direction from right to left or from left to right.", "chatgpt-answer": "B. in circles", "video-llm-prediction": "A group of women are seen running on a track, with one of them leading the pack. They are running in circles and passing the baton to each other.", "gt-answer": "C. from left to right", "rating": 0 } ] }, "1098153561": { "speed": [ { "chatgpt-reasoning": "The video description does not mention any specific manipulation of the speed of the video, such as time-lapse or slow motion. It simply describes the scenery and the movement of a person walking through the forest. Therefore, it can be inferred that the video is in normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves scattered throughout. The camera captures the beauty of the forest, highlighting the vibrant colors of the leaves. The video also features a person walking through the forest, adding a sense of movement and life to the scene. The camera captures the person's movement, providing a sense of scale and depth to the forest. The video ends with a shot of the sun shining through the trees, creating a warm and inviting atmosphere.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any alteration in the speed or time manipulation. It simply describes the scenery in a narrative style. Therefore, we can assume that the video is presented in normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves scattered throughout. The camera pans around the forest, capturing the beauty of the trees and the warmth of the sun. The video ends with a shot of the sun setting, casting a warm glow over the forest.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. We cannot determine whether the video is at normal speed, time-lapse, or in slow motion based on the given description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves, and the camera captures the beauty of the trees and the sun shining through.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, there is no mention of any manipulation or alteration of the video speed. It simply describes the beauty of the forest and the changing of the seasons. Therefore, the video is most likely at normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves scattered throughout. The camera captures the beauty of the forest, with the sun shining through the trees, creating a warm and inviting atmosphere. The video highlights the natural beauty of the forest and the changing of the seasons.", "gt-answer": "B. time-lapse", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the leaves are changing color from green to red and some are falling off the trees.", "chatgpt-answer": "C. changing color from green to red", "video-llm-prediction": "The video showcases the beauty of autumn in a forest. The camera pans around the trees, capturing the vibrant colors of the leaves. The leaves are seen changing from green to red, and some are falling off the trees. The camera also captures the sun shining through the trees, creating a warm and inviting atmosphere. The video highlights the natural beauty of the forest during the fall season.", "gt-answer": "C. changing color from green to red", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the leaves are changing and highlights their vibrant yellow color, indicating a change in color from green to yellow. It doesn't mention anything about changing shape, falling off, or growing larger.", "chatgpt-answer": "C. changing color from green to red", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves scattered throughout. The camera pans around the forest, highlighting the beauty of the changing leaves. The video captures the essence of nature's beauty and the changing seasons.", "gt-answer": "C. changing color from green to red", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the leaves in the forest are yellowing, indicating a change in color. This suggests that the leaves are changing color, not any of the other options listed.", "chatgpt-answer": "C. changing color from green to red", "video-llm-prediction": "The video shows a forest with yellowing leaves and a sun shining through the trees.", "gt-answer": "C. changing color from green to red", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the leaves are changing color from green to red and falling off the trees.", "chatgpt-answer": "B. falling off", "video-llm-prediction": "The video showcases the beauty of autumn as the leaves change from green to red and fall off the trees. The camera pans around the forest, capturing the vibrant colors of the leaves and the sun shining through the trees. The video ends with a shot of the forest floor covered in leaves.", "gt-answer": "C. changing color from green to red", "rating": 0 } ] }, "1084153195": { "action": [ { "chatgpt-reasoning": "The video description mentions that the dolphins are swimming, jumping, sleeping, and diving in the water.", "chatgpt-answer": "A. Diving, B. Swimming, C. Sleeping, D. Jumping", "video-llm-prediction": "The video shows two dolphins swimming in the ocean. They are seen jumping and swimming around. The dolphins are also seen sleeping and diving. The video captures the beauty and grace of these aquatic animals in their natural habitat.", "gt-answer": "B. Swimming", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dolphins are swimming in the water. Additionally, it mentions that one of the dolphins is jumping out of the water, indicating movement and activity.", "chatgpt-answer": "B. Swimming", "video-llm-prediction": "The video showcases two dolphins swimming in the ocean, with one dolphin jumping out of the water. The dolphins are seen swimming and interacting with each other, creating a serene and peaceful atmosphere. The video captures the beauty and grace of these aquatic creatures, as they move gracefully through the water. The sound of the waves crashing against the shore and the splashing of the dolphins adds to the overall ambiance of the video. Overall, the video provides a calming and relaxing experience for the viewer, allowing them to appreciate the beauty", "gt-answer": "B. Swimming", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the dolphins are \"swimming\" in the ocean.", "chatgpt-answer": "B. Swimming", "video-llm-prediction": "Two dolphins are seen swimming in the ocean.", "gt-answer": "B. Swimming", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the dolphins are seen swimming in the ocean and then they suddenly jump out of the water.", "chatgpt-answer": "D. Jumping", "video-llm-prediction": "Two dolphins are seen swimming in the ocean, and they suddenly jump out of the water.", "gt-answer": "B. Swimming", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description clearly states that the dolphins are swimming towards the shore.", "chatgpt-answer": "A. swimming towards the shore", "video-llm-prediction": "The video shows two dolphins swimming towards the shore. They are seen swimming in the water, and their fins are visible. The dolphins are seen swimming in the water, and their fins are visible. The dolphins are seen swimming in the water, and their fins are visible. The dolphins are seen swimming in the water, and their fins are visible. The dolphins are seen swimming in the water, and their fins are visible. The dolphins are seen swimming in the water, and their fins are visible. The dolphins are seen swimming in the", "gt-answer": "A. swimming towards the shore", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the dolphins are swimming towards the shore, hovering in one place, and swimming away from the shore.", "chatgpt-answer": "A. swimming towards the shore, B. hovering in one place, C. swimming away from the shore", "video-llm-prediction": "The video showcases two dolphins swimming towards the shore, then hovering in one place, and finally swimming away from the shore.", "gt-answer": "A. swimming towards the shore", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dolphins initially swim towards the shore, then hover in one place, and finally swim away from the shore.", "chatgpt-answer": "A. swimming towards the shore, B. hovering in one place, C. swimming away from the shore", "video-llm-prediction": "Two dolphins swim towards the shore, then hover in one place before swimming away from the shore.", "gt-answer": "A. swimming towards the shore", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the dolphins initially swim towards the shore, then hover in one place before swimming away from the shore.", "chatgpt-answer": "A. swimming towards the shore, B. hovering in one place, C. swimming away from the shore", "video-llm-prediction": "Two dolphins swim towards the shore, then hover in one place before swimming away from the shore.", "gt-answer": "A. swimming towards the shore", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description does not provide explicit information about the rate of movement in the video. It only mentions that the dolphins are seen swimming in the water and then swimming towards the camera, but it doesn't specify the speed. Therefore, there is not enough information to determine the rate of movement.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows two dolphins swimming in the ocean. They are seen swimming next to each other and then swimming away from each other. The dolphins are seen swimming in the water and then they swim towards the camera. The video captures the beauty of the ocean and the graceful movements of the dolphins. The dolphins are seen swimming in the water and then they swim towards the camera. The video provides a serene and peaceful view of the ocean and the dolphins.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that dolphins are swimming in the ocean, but it does not provide any specific information about the rate of movement. Therefore, we cannot determine the rate of movement from the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Dolphins swimming in the ocean.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the dolphins are swimming in the ocean, but it does not provide any information about the speed of their movement. Therefore, we cannot determine the rate of movement based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows two dolphins swimming in the ocean.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that dolphins are swimming in the ocean, but it does not provide any information about their rate of movement. Therefore, we cannot determine the rate of movement based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Dolphins swimming in the ocean.", "gt-answer": "C. normal speed", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that the dolphins first swim towards the shore, where they are fed with fish. Then, they swim in circles and enjoy the fish. Therefore, the correct sequence of events involving dolphins is swimming towards the shore, then getting fed with fish.", "chatgpt-answer": "A. swimming towards the shore, then getting fed with fish", "video-llm-prediction": "The video shows two dolphins swimming towards the shore, where they are fed with fish. The dolphins then swim in circles, enjoying the fish.", "gt-answer": "A. swimming towards the shore, then getting fed with fish", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the dolphins first swim towards the shore, where they are fed fish. Then, they swim in circles, enjoying the water.", "chatgpt-answer": "A. swimming towards the shore, then getting fed with fish", "video-llm-prediction": "The video shows two dolphins swimming towards the shore, where they are fed fish. They then swim in circles, enjoying the water.", "gt-answer": "A. swimming towards the shore, then getting fed with fish", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the dolphins are first swimming towards the shore and then getting fed with fish.", "chatgpt-answer": "A. swimming towards the shore, then getting fed with fish", "video-llm-prediction": "Dolphins swimming towards the shore, then getting fed with fish.", "gt-answer": "A. swimming towards the shore, then getting fed with fish", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the dolphins are seen swimming towards the shore, then they get fed with fish. After that, they swim in circles before swimming towards the shore again.", "chatgpt-answer": "A. swimming towards the shore, then getting fed with fish", "video-llm-prediction": "Two dolphins are seen swimming towards the shore, and then they get fed with fish. They swim in circles, and then they swim towards the shore again.", "gt-answer": "A. swimming towards the shore, then getting fed with fish", "rating": 1 } ] }, "1054717541": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is kneading dough and then proceeds to cut the dough and grill it.", "chatgpt-answer": "B. kneading dough", "video-llm-prediction": "A man is seen kneading dough in a video. He then proceeds to cut the dough and grill it.", "gt-answer": "B. kneading dough", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is kneading dough and then proceeds to cut the dough and grill it.", "chatgpt-answer": "B. kneading dough", "video-llm-prediction": "A man is seen kneading dough in a video. He then proceeds to cut the dough and grill it.", "gt-answer": "B. kneading dough", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is seen kneading dough, cutting it, and grilling it.", "chatgpt-answer": "A. cutting dough", "video-llm-prediction": "A man is seen kneading dough, cutting it, and grilling it.", "gt-answer": "B. kneading dough", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen kneading dough, cutting it, and grilling it.", "chatgpt-answer": "The person is doing all three actions mentioned in the description - kneading dough, cutting it, and grilling it. Therefore, the correct answer is: A. cutting dough, B. kneading dough, C. grilling dough.", "video-llm-prediction": "A man is seen kneading dough, cutting it, and grilling it.", "gt-answer": "B. kneading dough", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description does not mention anything about the speed or any special effects applied. It simply describes the actions of the man kneading, flattening, rolling, and adding flour to the dough. Therefore, we can assume that the video is playing at normal speed.", "chatgpt-answer": "C. at normal speed", "video-llm-prediction": "A man is shown kneading dough on a table. He then proceeds to flatten the dough and adds more flour to it. The man then rolls the dough out and adds more flour to it. He then kneads the dough again and rolls it out once more. The man then adds more flour to the dough and kneads it again. Finally, the man rolls the dough out one last time.", "gt-answer": "A. in slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed at which the video is playing. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a man kneading dough on a floured surface. He then shapes the dough into a ball and places it on a floured surface. The man then kneads the dough again and shapes it into a ball. He then places the dough on a floured surface and kneads it once more. The video ends with the man placing the dough on a floured surface and kneading it one final time.", "gt-answer": "A. in slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed or any special effects in the video. It only describes the actions of a man kneading dough. Therefore, we can assume that the video is playing at normal speed.", "chatgpt-answer": "C. at normal speed", "video-llm-prediction": "A man is seen kneading dough on a table. He then adds flour to the dough and kneads it again.", "gt-answer": "A. in slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, there is no evidence to suggest that the video is playing in slow motion or with a time-lapse effect. As a result, we can assume that the video is playing at normal speed.", "chatgpt-answer": "C. at normal speed", "video-llm-prediction": "A man is shown kneading dough on a table. He then adds flour to the dough and kneads it again. The video ends with the man showing off the finished product.", "gt-answer": "A. in slow motion", "rating": 0 } ] }, "1081092839": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the sun is seen setting in the distance, which indicates that the direction of the sun is descending.", "chatgpt-answer": "A. descending", "video-llm-prediction": "The video captures the serene beauty of a snowy landscape during a beautiful sunset. The sun is seen setting in the distance, casting a warm glow over the snow-covered trees. The camera then pans to the left, showcasing the vastness of the snowy field. The sun continues to set, and the sky gradually turns from orange to purple. The video ends with the sun completely setting, leaving behind a stunning view of the snowy landscape.", "gt-answer": "A. descending", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the sun is setting in the sky. This indicates that the sun is descending.", "chatgpt-answer": "A. descending", "video-llm-prediction": "The video showcases a serene winter landscape with a beautiful sunset in the background. The sun is seen setting in the sky, casting a warm glow over the snow-covered trees. The video captures the tranquility of the scene, with the sun setting in the distance and the snow-covered trees standing tall. The video is a perfect representation of the beauty of winter and the peacefulness of nature.", "gt-answer": "A. descending", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sun is setting in the sky. When the sun sets, it appears to be descending below the horizon.", "chatgpt-answer": "A. descending", "video-llm-prediction": "The sun is seen setting in the sky, and the trees are silhouetted against the sky.", "gt-answer": "A. descending", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sun sets in the background, indicating that it is descending.", "chatgpt-answer": "A. descending", "video-llm-prediction": "The video captures the serene beauty of a snowy landscape during a sunset. The sun sets in the background, casting a warm glow on the snow-covered trees. The video showcases the tranquility of the scene, with the sun setting in the background and the snow-covered trees standing tall.", "gt-answer": "A. descending", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description does not mention any specific speed at which the video is playing. Therefore, it is not possible to determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene winter landscape with a beautiful sunset in the background. The camera captures the sun setting in the distance, casting a warm glow on the snowy landscape. The camera then pans to the left, revealing a snowy field with trees in the background. The camera then pans to the right, revealing a snowy field with trees in the background. The camera then pans to the left, revealing a snowy field with trees in the background. The camera then pans to the right, revealing a snowy field with trees in the background. The camera then p", "gt-answer": "A. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "Based on the description, there is no specific mention of the speed of the video. Therefore, it cannot be determined from the information given.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene winter landscape with a beautiful sunset in the background. The camera pans around the snowy field, capturing the beauty of the sunset and the surrounding trees. The video ends with a shot of the sunset.", "gt-answer": "A. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene winter landscape with snow-covered trees and a beautiful sunset.", "gt-answer": "A. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. None of the choices can be determined based on the given description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene winter landscape with a beautiful sunset in the background. The camera pans around the snowy field, capturing the stunning colors of the sky. The video also features a tree with branches covered in snow, adding to the beauty of the scene.", "gt-answer": "A. time-lapse", "rating": 0 } ] }, "1059462749": { "action": [ { "chatgpt-reasoning": "The video description states that a man is seen climbing down a ladder while another man is reading a book. This indicates that the action being performed by the person is climbing down a ladder.", "chatgpt-answer": "C. climbing down a ladder", "video-llm-prediction": "A man is seen climbing down a ladder while another man is reading a book.", "gt-answer": "C. climbing down a ladder", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a man is seen climbing down a ladder. None of the other choices (reading a book, cooking, riding a bike) are mentioned or indicated in the video description.", "chatgpt-answer": "C. climbing down a ladder", "video-llm-prediction": "A man is seen climbing down a ladder while wearing blue jeans and a blue shirt. He is also wearing shoes.", "gt-answer": "C. climbing down a ladder", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the person is climbing down a ladder.", "chatgpt-answer": "C. climbing down a ladder", "video-llm-prediction": "A person is seen climbing down a ladder.", "gt-answer": "C. climbing down a ladder", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the man is \"climbing down a ladder\".", "chatgpt-answer": "C. climbing down a ladder", "video-llm-prediction": "A man is seen climbing down a ladder while wearing blue jeans and a blue shirt.", "gt-answer": "C. climbing down a ladder", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that a man is climbing a ladder while another man is climbing down. Since the man climbing down is moving in the opposite direction of the man climbing up, we can infer that the person is moving downwards.", "chatgpt-answer": "B. downwards", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing down. The man climbing down is wearing blue pants and blue shirt.", "gt-answer": "B. downwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is climbing up and down the ladder. This means that the person is moving vertically, either going up or going down. Since the description also mentions that the person is looking back at the camera, it indicates that the person is moving upwards while facing the camera.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man is seen climbing a ladder in a factory. He climbs up and down the ladder while looking back at the camera.", "gt-answer": "B. downwards", "rating": 0 }, { "chatgpt-reasoning": "The video description states that one man is climbing up the ladder while another man is climbing down. This indicates that the person is moving upwards.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man climbs a ladder while another man climbs down.", "gt-answer": "B. downwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that one man is climbing a ladder while another man is climbing downwards. It implies that the person is moving upwards.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing downwards.", "gt-answer": "B. downwards", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is shot in a time-lapse mode, which means it is sped up.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "A man is seen walking on a ladder while wearing blue jeans and a blue shirt. He climbs up the ladder while looking back at the camera. The video is shot in a time-lapse mode, and the man is seen climbing up the ladder at a normal speed. The video captures the man's movements as he climbs up the ladder, and the camera follows him from behind. The video ends with the man reaching the top of the ladder.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the actions and visuals in the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video depicts a man performing a dangerous stunt by climbing a metal ladder while wearing blue jeans and a blue shirt. He is seen climbing up the ladder while holding onto the metal bars, and he eventually reaches the top of the ladder. The video emphasizes the importance of safety and the potential risks associated with such stunts.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically states that it is a time-lapse video, which means the video is sped up to make the action appear faster than in reality.", "chatgpt-answer": "A. time-lapse", "video-llm-prediction": "A man is seen climbing a ladder in a time-lapse video.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is climbing up and down the ladder slowly and carefully, taking each step with caution. This indicates that the video is at normal speed.", "chatgpt-answer": "B. normal speed", "video-llm-prediction": "A man is seen climbing a ladder in a factory. He climbs up the ladder slowly and carefully, taking each step with caution. Once he reaches the top, he turns around and starts climbing back down. The video captures the man's movements as he climbs up and down the ladder, showcasing his physical abilities and determination.", "gt-answer": "B. normal speed", "rating": 1 } ] }, "1077590324": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the woman is seen \"doing laundry\" by putting clothes into a washing machine and then taking them out to hang them up.", "chatgpt-answer": "A. doing laundry", "video-llm-prediction": "A woman is seen doing laundry in a room. She is seen putting clothes into a washing machine and then taking them out to hang them up.", "gt-answer": "A. doing laundry", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is doing laundry, specifically putting clothes into a washing machine and then taking them out to hang them up.", "chatgpt-answer": "A. doing laundry", "video-llm-prediction": "A woman is seen doing laundry in a room. She is seen putting clothes into a washing machine and then taking them out to hang them up.", "gt-answer": "A. doing laundry", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the woman is doing laundry in a room.", "chatgpt-answer": "A. doing laundry", "video-llm-prediction": "A woman is seen doing laundry in a room.", "gt-answer": "A. doing laundry", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the woman is doing laundry and putting clothes into the washing machine.", "chatgpt-answer": "A. doing laundry", "video-llm-prediction": "A woman is seen doing laundry in a room. She is seen kneeling down in front of a washing machine and putting clothes into it.", "gt-answer": "A. doing laundry", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the video is shot in slow motion.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "A woman is seen kneeling down in front of a washing machine and putting clothes into it. She then proceeds to take out the clothes and hangs them up on a clothesline. The video showcases the woman's daily routine of washing clothes and hanging them up to dry. The video is shot in slow motion, giving the viewer a detailed view of the woman's actions. The video is shot in a well-lit room, and the woman is wearing casual clothes. The video is shot in a simple and straightforward manner, with no background music or sound effects. Overall, the video", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the actions and process of washing a garment using a washing machine.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A woman is seen kneeling down in front of a washing machine and putting a garment into the machine. She then proceeds to wash the garment by turning the knobs and pushing buttons. After the washing process is complete, she takes the garment out of the machine and hangs it up to dry. The video showcases the process of washing a garment using a washing machine.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Without any information about the speed, it is not possible to determine the correct answer.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen washing clothes in a sink. She then proceeds to wash the clothes in a washing machine.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen kneeling down in front of a washing machine and putting clothes into it. She then proceeds to turn the dials and begins washing the clothes.", "gt-answer": "B. normal speed", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "According to the video description, the woman is first seen sitting down and putting clothes into the washing machine. Then, she stands up and operates the washing machine. Therefore, the correct order of events is: B. Putting clothes into the washing machine and then standing up to operate the washing machine.", "chatgpt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "video-llm-prediction": "A woman is seen sitting down and putting clothes into a washing machine. She then stands up and operates the washing machine.", "gt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is sitting down and putting clothes into the washing machine first, and then she stands up to operate the washing machine.", "chatgpt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "video-llm-prediction": "A woman is seen sitting down and putting clothes into a washing machine. She then stands up and operates the washing machine.", "gt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman first sits down to operate the washing machine and then puts clothes into the machine.", "chatgpt-answer": "A. Sitting down to operate the washing machine and then putting clothes into the washing machine", "video-llm-prediction": "A woman is seen sitting down to operate a washing machine and then putting clothes into the machine.", "gt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is first seen sitting down and putting clothes into the washing machine. Then, she stands up and operates the washing machine.", "chatgpt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "video-llm-prediction": "A woman is seen sitting down and putting clothes into a washing machine. She then stands up and operates the washing machine.", "gt-answer": "B. Putting clothes into the washing machine and then standing up to operate the washing machine", "rating": 1 } ] }, "1040541401": { "action": [ { "chatgpt-reasoning": "The video description mentions that the children are engaged in various activities, including painting pictures, reading books, and doing chemical experiments. Soccer is not mentioned as one of the activities.", "chatgpt-answer": "A. painting pictures, B. reading books, C. doing chemical experiments", "video-llm-prediction": "The video shows a group of children in a classroom setting, with a man standing behind them. The children are engaged in various activities, including painting pictures, reading books, and doing chemical experiments. The man is seen interacting with the children, providing guidance and support. The video highlights the importance of education and the role of teachers in fostering a love for learning in children.", "gt-answer": "C. doing chemical experiments", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the children are mixing two liquids together and observing the changes in color, indicating that they are doing chemical experiments.", "chatgpt-answer": "C. doing chemical experiments", "video-llm-prediction": "In the video, a group of children is seen sitting at a table, with a man standing behind them. The man is seen pouring a liquid into a beaker and mixing it with another liquid. The children are then seen mixing the two liquids together and observing the changes in color. The video seems to be focused on teaching children about chemical reactions and the properties of different liquids. The man in the video appears to be a teacher or a guide, and he is explaining the process to the children. The setting of the video is not clear, but it seems to be a classroom or a laboratory. Over", "gt-answer": "C. doing chemical experiments", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the children are doing chemical experiments.", "chatgpt-answer": "C. doing chemical experiments", "video-llm-prediction": "The video shows a group of children doing chemical experiments with the help of a man.", "gt-answer": "C. doing chemical experiments", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that one child is mixing a blue liquid in a beaker, indicating that they are doing a chemical experiment. Additionally, the video mentions another child painting a picture and another child reading a book. Based on this information, we can conclude that the children are engaged in various activities including painting pictures, reading books, and doing chemical experiments.", "chatgpt-answer": "A. painting pictures, B. reading books, C. doing chemical experiments", "video-llm-prediction": "The video shows a group of children in a classroom, where they are engaged in various activities. One child is seen mixing a blue liquid in a beaker, while another is painting a picture. Additionally, a child is reading a book, and another is doing a science experiment. The video captures the children's curiosity and creativity as they explore the world around them.", "gt-answer": "C. doing chemical experiments", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description provides information about the activities happening in the video, but it does not mention anything about the speed of the video. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a group of children in a classroom, with a man standing behind them. The man is seen mixing a liquid in a beaker while the children watch. The children then take turns mixing the liquid and adding ingredients to a test tube. The man continues to mix the liquid while the children watch. The video ends with the man mixing the liquid one last time.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the activities happening in the video during a science experiment in a classroom. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a group of children in a classroom, with a man standing behind them. The man is seen mixing a liquid in a beaker while the children watch. The children then take turns mixing the liquid and adding ingredients to a test tube. The man then shows the children how to use a thermometer to check the temperature of the liquid. The children then take turns mixing the liquid again and adding ingredients to another test tube. The man then shows the children how to use a microscope to observe the liquid. Overall, the video depicts a science experiment being conducted in a class", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A man and two children are shown in a classroom, with the man pouring a liquid into a beaker and mixing it with a stirrer. The children are shown mixing the same liquid in their own beakers.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, there is no information provided about the speed of the video. The description only mentions the actions and events happening in the video, but does not specify anything about the speed at which these actions are occurring.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of children in a classroom, with a man standing next to them. The man is seen mixing a liquid in a beaker while the children watch. The children then take turns mixing the liquid and adding ingredients to a test tube. The video ends with the man mixing the contents of the test tube.", "gt-answer": "B. normal speed", "rating": 0 } ] }, "1059072773": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the ice cream is seen melting and dripping down the surface, and also freezing and solidifying.", "chatgpt-answer": "A. melting", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is seen melting and dripping down the surface. The video also shows the ice cream freezing and solidifying.", "gt-answer": "A. melting", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the ice cream goes through the process of melting, freezing, evaporating, and solidifying. Therefore, all of the options are correct.", "chatgpt-answer": "A. melting, B. freezing, C. evaporating, D. solidifying", "video-llm-prediction": "The video showcases the process of ice cream melting, freezing, evaporating, and solidifying. The video starts with a close-up shot of ice cream, which then transitions to a shot of the ice cream melting. The camera then pans out to show the ice cream freezing, and the video ends with a shot of the ice cream evaporating. The video provides a detailed look at the process of ice cream, from its melting to freezing and solidifying. The viewer can see the different stages of ice cream, from its melting to free", "gt-answer": "A. melting", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the ice cream is melting, which means it is changing from a solid state to a liquid state.", "chatgpt-answer": "A. melting", "video-llm-prediction": "A scoop of ice cream melts on a pink background.", "gt-answer": "A. melting", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the ice cream is going through the processes of melting, freezing, evaporating, and solidifying.", "chatgpt-answer": "A. melting", "video-llm-prediction": "The video showcases the process of ice cream melting, freezing, evaporating, and solidifying.", "gt-answer": "A. melting", "rating": 1 } ] }, "1064645467": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is seen wearing different clothing items, including shirts, jackets, and ties. This implies that he is getting dressed.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen wearing a suit and tie while standing in front of a park. He then proceeds to put on a black shirt and ties it up. After that, he puts on a black jacket and ties it up as well. He then proceeds to put on a white shirt and ties it up. Finally, he puts on a black tie and ties it up.", "gt-answer": "C. exercising", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is seen wearing a suit and tie, throwing a punch in the air, putting on his tie, and adjusting it. This sequence of actions suggests that the man is likely preparing for something rather than cooking, reading a book, or watching TV. Given the physical activity involved, the most appropriate choice is exercising.", "chatgpt-answer": "C. exercising", "video-llm-prediction": "A man is seen wearing a suit and tie, and he is seen throwing a punch in the air. He then proceeds to put on his tie and adjusts it. The man then walks away from the camera.", "gt-answer": "C. exercising", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is putting on a tie, which suggests that he is getting ready for an event or occasion. None of the other choices (cooking, reading a book, exercising, watching TV) are related to putting on a tie.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A man is seen putting on a tie while standing in front of a playground.", "gt-answer": "C. exercising", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is exercising in a park, doing push-ups and stretching his arms.", "chatgpt-answer": "C. exercising", "video-llm-prediction": "A man is seen exercising in a park while wearing a suit. He is seen doing push-ups and stretching his arms.", "gt-answer": "C. exercising", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the video is shot in slow motion.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video shows a man wearing a suit and tie who is seen adjusting his tie and jacket. He then proceeds to do arm exercises while looking off into the distance. The man is seen wearing a white shirt and black pants throughout the video. The video is shot in a park with trees and grass in the background. The man is seen wearing a watch on his left hand. The video is shot in slow motion, and the man is seen wearing a black jacket in some shots. The video ends with the man walking away from the camera.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention or provide any clues about the speed of the video. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man wearing a suit and tie, who is seen walking around a park and adjusting his tie. He then proceeds to put on his jacket and continues walking around the park. The video seems to be a casual stroll in the park, with the man dressed in formal attire. The man's actions of adjusting his tie and putting on his jacket suggest that he may be preparing for a formal event or just finished one. The park setting provides a peaceful and relaxing atmosphere, with the man enjoying the natural surroundings. Overall, the video captures a", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "From the video description, there is no mention of the video being in slow motion or time-lapse. The description simply states the actions of the man adjusting his tie and doing a handstand, without indicating any alteration in speed.", "chatgpt-answer": "C. normal speed", "video-llm-prediction": "A man in a suit is seen adjusting his tie in front of a playground. He then proceeds to do a handstand on a park bench.", "gt-answer": "C. normal speed", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man in a suit and tie adjusting his tie and then throwing it on a nearby bench.", "gt-answer": "C. normal speed", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description clearly states that the man is first seen jumping up to grab the bar, then putting on his jacket, and finally taking off his jacket before jumping up again to grab the bar.", "chatgpt-answer": "C. jumping up to grab the bar and then taking off his jacket", "video-llm-prediction": "A man is seen wearing a suit and tie, and he is seen jumping up to grab a bar. He then puts on his jacket and jumps up again to grab the bar. He then takes off his jacket and jumps up one last time to grab the bar.", "gt-answer": "D. taking off his jacket and then jumping up to grab the bar", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen putting on his jacket and then jumping up to grab a bar. He then takes off his jacket and jumps up to grab the bar again. This indicates that the correct order of events is B. putting on his jacket and then jumping up to grab the bar.", "chatgpt-answer": "B. putting on his jacket and then jumping up to grab the bar", "video-llm-prediction": "The video shows a man wearing a suit and tie who is seen putting on his jacket and then jumping up to grab a bar. He then takes off his jacket and jumps up to grab the bar again. The video seems to be showcasing the man's athletic abilities and his ability to multitask. The man's attire suggests that he is dressed for a formal event, and his actions demonstrate his strength and agility. The video is a great example of how one can combine physical activity with professional attire. Overall, the video is a great representation of how one can stay", "gt-answer": "D. taking off his jacket and then jumping up to grab the bar", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is first seen \"jumping up to grab a bar\" and then \"putting on his jacket\". This indicates that the man first performs the action of jumping up to grab the bar and then proceeds to put on his jacket.", "chatgpt-answer": "A. jumping up to grab the bar and then putting on his jacket", "video-llm-prediction": "A man is seen wearing a suit and tie, jumping up to grab a bar and then putting on his jacket.", "gt-answer": "D. taking off his jacket and then jumping up to grab the bar", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is first putting on his jacket and then jumping up to grab the bar.", "chatgpt-answer": "B. putting on his jacket and then jumping up to grab the bar", "video-llm-prediction": "A man is seen putting on his jacket and then jumping up to grab the bar.", "gt-answer": "D. taking off his jacket and then jumping up to grab the bar", "rating": 0 } ] }, "1088279109": { "direction": [ { "chatgpt-reasoning": "The video description states that the elevator is going up. This is consistent with the video showing the elevator moving up and down, indicating that it is indeed rising.", "chatgpt-answer": "A. rising", "video-llm-prediction": "The video shows an elevator going up and down, and it is consistent with the information that the elevator is going up. The other information is not consistent with the video.", "gt-answer": "A. rising", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the elevator is seen going up and down, and at one point, it is stationary. This implies that the elevator is both rising and going down.", "chatgpt-answer": "A. rising and B. going down", "video-llm-prediction": "The video showcases an elevator in a building, with a focus on its movement. The elevator is seen going up and down, and at one point, it is stationary. The video captures the elevator's ascent and descent, highlighting its functionality and purpose within the building.", "gt-answer": "A. rising", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the elevator is going up and down.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows an elevator going up and down.", "gt-answer": "A. rising", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the elevator is going up and down in a building, which means it is moving vertically.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows an elevator going up and down in a building.", "gt-answer": "A. rising", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is shot in slow motion, which means the movements in the video are slower than in real-time.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video shows a glass elevator inside a building. The camera pans around the elevator, and we can see the inside of the elevator. The video is shot in slow motion, and we can see the details of the elevator's interior. The video is shot from different angles, and we can see the entire elevator from the top to the bottom. The video is shot in a time-lapse, and we can see the entire elevator in a few seconds. The video is shot in a normal speed, and we can see the entire elevator in a few minutes. Overall, the video provides a", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video, so we cannot determine it based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video showcasing a glass elevator in a building with a glass wall. The video starts with a close-up of the elevator, and then it shows the entire elevator moving up and down. The video then shows the entire building, and the elevator is seen moving up and down. The video ends with a close-up of the elevator.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. It only describes the movement of an elevator up and down in a building. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of an elevator moving up and down in a building.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video is in slow motion.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "A video of a glass elevator moving up and down in a building is shown. The video is in slow motion, and the glass elevator is seen moving up and down in the building.", "gt-answer": "C. normal speed", "rating": 0 } ] }, "1093573255": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the plants are seen growing and changing over time, with the leaves becoming more vibrant and the plant growing taller. This indicates that the video is showing a condensed representation of time, which is characteristic of a time-lapse video.", "chatgpt-answer": "C. time-lapse", "video-llm-prediction": "The video showcases a white ceramic planter with green ivy plants in it. The plants are seen growing and changing over time, with the leaves becoming more vibrant and the plant growing taller. The video also includes a close-up shot of the plant, highlighting its texture and color. The video ends with a shot of the plant in the planter, showcasing its growth and beauty.", "gt-answer": "C. time-lapse", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the plant is seen swaying in the wind and the camera captures its movement. There is no mention of any time manipulation or alteration of speed in the video description.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a plant in a white pot, which is placed on a table. The plant is seen swaying in the wind, and the camera captures its movement. The video also features a close-up shot of the plant, highlighting its vibrant green color and intricate leaf patterns. The serene and calming sound of the wind adds to the peaceful ambiance of the video. Overall, the video provides a soothing and relaxing experience for the viewer.", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. Therefore, it is impossible to determine the speed based on the given description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A white pot with a plant in it is shown in the video.", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. There is no mention of slow motion or time-lapse in the description. Therefore, it can be assumed that the video is running at normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "A white pot with green leaves in it is shown in the video.", "gt-answer": "C. time-lapse", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the plant starts wilting but then revives and grows. This indicates that the plant goes through a process of wilting, followed by reviving and growing.", "chatgpt-answer": "D. growing", "video-llm-prediction": "The video shows a plant in a white pot that is wilting. However, the plant is then shown reviving and growing. The video also shows the plant in a brown pot, but it is not clear if this is the same plant or a different one. Overall, the video highlights the resilience of plants and their ability to bounce back from adversity.", "gt-answer": "B. reviving", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the plant is initially wilted but then revives and starts growing. This suggests that the plant is undergoing a process of wilting, reviving, and growing.", "chatgpt-answer": "D. growing", "video-llm-prediction": "The video showcases a plant in a white pot that is initially wilted but then revives and starts growing. The plant is seen in various positions, including in the corner of a room and on a table. The video highlights the plant's growth and revival, emphasizing the importance of taking care of plants and watching them grow.", "gt-answer": "B. reviving", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the plant is wilting, then reviving, and finally decaying. None of the choices of growing are mentioned in the video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A plant in a white pot is shown wilting, then reviving, and finally decaying.", "gt-answer": "B. reviving", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the plant is shown wilting, then reviving, and finally decaying.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A plant in a white pot is shown wilting, then reviving, and finally decaying.", "gt-answer": "B. reviving", "rating": 0 } ] }, "1105233293": { "action": [ { "chatgpt-reasoning": "The video description clearly mentions that a man in a yellow shirt is playing basketball on a court. Additionally, it states that he is seen dribbling the ball and then making a shot, which confirms that the people in the video are indeed playing basketball.", "chatgpt-answer": "C. playing basketball", "video-llm-prediction": "A man in a yellow shirt is playing basketball on a court. He is seen dribbling the ball and then making a shot. The crowd cheers as he runs back to the bench.", "gt-answer": "C. playing basketball", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that a man in a yellow shirt is playing basketball on a court. The description mentions that he is dribbling the ball and throwing it into the basket, which are actions commonly associated with playing basketball.", "chatgpt-answer": "C. playing basketball", "video-llm-prediction": "A man in a yellow shirt is playing basketball on a court. He is seen dribbling the ball and then throwing it into the basket. The crowd cheers as he makes the shot.", "gt-answer": "C. playing basketball", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a man in a yellow shirt shoots a basketball into the hoop while another man in a yellow shirt and white shorts runs towards him. This indicates that the people in the video are playing basketball.", "chatgpt-answer": "C. playing basketball", "video-llm-prediction": "A man in a yellow shirt shoots a basketball into the hoop while another man in a yellow shirt and white shorts runs towards him.", "gt-answer": "C. playing basketball", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a man in a yellow shirt is playing basketball on a court. He runs up to the basket, throws the ball, and high fives his teammates. All of these actions indicate that the people in the video are playing basketball.", "chatgpt-answer": "C. playing basketball", "video-llm-prediction": "A man in a yellow shirt is playing basketball on a court. He runs up to the basket and throws the ball, which goes in. He then runs back to the bench and high fives his teammates.", "gt-answer": "C. playing basketball", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is shot in a fast-motion effect, indicating that the pace of the video is accelerated.", "chatgpt-answer": "A. accelerated speed", "video-llm-prediction": "The video shows a basketball player dribbling the ball and then making a shot. The player is seen running towards the basket and throwing the ball into it. The video is shot in a fast-motion effect, and the player's movements are captured in detail. The video also shows the player's teammates celebrating the shot. The video is shot in a high-quality format, and the sound of the ball bouncing and the player's footsteps can be heard. Overall, the video showcases the player's skills and the excitement of the game.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any specific information about the pace of the video, such as whether it is in normal or accelerated speed, slow-motion, or reversed speed. Therefore, we cannot determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a basketball player dribbling the ball and making a shot. The player then runs towards the bench and hugs a man. The video captures the excitement and energy of the game, with the player's skillful dribbling and shooting, and the celebration of the successful shot. The video also highlights the camaraderie between the players and the supportive atmosphere of the game.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, there is no specific information regarding the pace of the video. The description only mentions that a basketball player shoots a ball into the basket while being watched by a crowd. However, it does not indicate whether the video is played at an accelerated speed, normal speed, reversed speed, or in slow-motion.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A basketball player shoots a ball into the basket while being watched by a crowd.", "gt-answer": "B. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the actions happening in the video, such as a basketball player shooting a ball into the basket and the crowd cheering. Therefore, we cannot determine the pace of the video based on the given description.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A basketball player wearing a yellow jersey shoots a ball into the basket while another player in a white jersey tries to block the shot. The player in yellow successfully shoots the ball into the basket, and the crowd cheers.", "gt-answer": "B. normal speed", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that the players are seen dribbling the ball and passing it to each other before one player shoots the ball into the basket. Therefore, the correct order of events is passing the ball to each other and then shooting the basketball.", "chatgpt-answer": "C. Passing the ball to each other and then shooting the basketball", "video-llm-prediction": "The video shows a group of basketball players playing on a court. They are seen dribbling the ball and passing it to each other. One player shoots the ball into the basket, and the others continue to play.", "gt-answer": "C. Passing the ball to each other and then shooting the basketball", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the players are seen dribbling the ball and passing it to each other, indicating that passing the ball comes before shooting the basketball. Therefore, the correct answer is C. Passing the ball to each other and then shooting the basketball.", "chatgpt-answer": "C. Passing the ball to each other and then shooting the basketball", "video-llm-prediction": "The video showcases a basketball game where players are seen dribbling the ball and passing it to each other. The game is intense, and the players are seen shooting the basketball while the crowd cheers them on. The video captures the players' skills and teamwork as they work together to score points.", "gt-answer": "C. Passing the ball to each other and then shooting the basketball", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the players are seen dribbling the ball and passing it to each other before shooting the basketball, indicating that passing the ball to each other happens before shooting the basketball.", "chatgpt-answer": "C. Passing the ball to each other and then shooting the basketball", "video-llm-prediction": "The video shows a group of players playing basketball on a court. They are seen dribbling the ball and passing it to each other before shooting the basketball.", "gt-answer": "C. Passing the ball to each other and then shooting the basketball", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the players are seen dribbling the ball and passing it to each other before shooting the basketball. This implies that passing the ball to each other comes before shooting the basketball.", "chatgpt-answer": "C. Passing the ball to each other and then shooting the basketball", "video-llm-prediction": "The video shows a group of players playing basketball on a court. They are seen dribbling the ball and passing it to each other before shooting the basketball. The players seem to be enjoying the game as they cheer and high-five each other. The video captures the energy and excitement of the game, with the players' movements and expressions adding to the overall atmosphere.", "gt-answer": "C. Passing the ball to each other and then shooting the basketball", "rating": 1 } ] }, "1077146132": { "action": [ { "chatgpt-reasoning": "The video description states that the woman wakes up in the middle of the night, tosses and turns in her bed, opens the curtains to let the sunlight in, stands there for a moment taking in the view, and then walks back to bed. Based on these actions, it can be concluded that the woman is waking up and briefly enjoying the view from the window before returning to bed.", "chatgpt-answer": "A. waking up", "video-llm-prediction": "A woman wakes up in the middle of the night and begins to toss and turn in her bed. She then gets up and walks over to a window, where she opens the curtains and lets the sunlight in. She stands there for a moment, taking in the view before turning away and walking back to bed.", "gt-answer": "A. waking up", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman wakes up in the middle of the night, tosses and turns in her bed, and then gets up to close the curtains. This implies that she initially wakes up, then moves around restlessly in her bed, and finally gets up to perform the action of closing the curtains.", "chatgpt-answer": "B. tossing and turning in the bed", "video-llm-prediction": "A woman wakes up in the middle of the night, tosses and turns in her bed, and then gets up to close the curtains.", "gt-answer": "A. waking up", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman wakes up in the middle of the night and walks to the window, opening the curtains to let the sunlight in. This indicates that the woman is waking up.", "chatgpt-answer": "A. waking up", "video-llm-prediction": "A woman wakes up in the middle of the night and walks to the window, opening the curtains to let the sunlight in.", "gt-answer": "A. waking up", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman wakes up in the middle of the night, tosses and turns in bed, and then falls back asleep. This indicates that she is going through a series of actions which include waking up, tossing and turning, and falling asleep again.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman wakes up in the middle of the night, tosses and turns in bed, and then falls back asleep.", "gt-answer": "A. waking up", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that the woman wakes up first and then gets out of bed. Only option A, \"Getting out of bed,\" matches this sequence of events.", "chatgpt-answer": "A. Getting out of bed", "video-llm-prediction": "A woman wakes up and gets out of bed, then she opens the curtains. She then closes the curtains and gets back onto the bed.", "gt-answer": "A. Getting out of bed", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the woman is getting out of bed first, indicating that it is the initial event in the sequence.", "chatgpt-answer": "A. Getting out of bed", "video-llm-prediction": "The video shows a woman getting out of bed and opening the curtains. She then closes the curtains and gets back onto the bed.", "gt-answer": "A. Getting out of bed", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman wakes up first, then gets out of bed, and finally opens the curtains. This means that \"Getting out of bed\" is the first event in the sequence.", "chatgpt-answer": "A. Getting out of bed", "video-llm-prediction": "A woman wakes up, gets out of bed, and opens the curtains.", "gt-answer": "A. Getting out of bed", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman wakes up before opening the curtains.", "chatgpt-answer": "A. Getting out of bed", "video-llm-prediction": "A woman wakes up and opens the curtains, then closes them and gets back into bed.", "gt-answer": "A. Getting out of bed", "rating": 1 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the woman is opening the curtains and walking away. This implies that more light is entering the room, so the video is turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video shows a woman standing in a room and opening the curtains. She then walks away from the curtains and turns around to face the camera. The video ends with the woman walking away.", "gt-answer": "C. turning brighter", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is seen opening the curtains and then closing them. It implies that there is a change in the lighting of the room when the curtains are opened and closed.", "chatgpt-answer": "B. turning darker", "video-llm-prediction": "The video shows a woman in a white shirt standing in front of a window. She is seen opening the curtains and then closing them. The video seems to be focused on the woman's actions in front of the window.", "gt-answer": "C. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a woman is opening the curtains of a window and letting the sunlight in. Opening the curtains and letting sunlight in indicates an increase in brightness.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video shows a woman opening the curtains of a window and letting the sunlight in.", "gt-answer": "C. turning brighter", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is opening the curtains, letting the sunlight in, and then closing the curtains. This indicates that there is a change in the amount of light entering the room.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video shows a woman opening the curtains of a window, letting the sunlight in, and then closing the curtains.", "gt-answer": "C. turning brighter", "rating": 1 } ] }, "1086688682": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the traffic light changes from red to green and then back to red. Although there is a mention of changing from red to yellow, it is mentioned that this information is not consistent with the video. Therefore, we can conclude that the correct answer is \"From red to green\".", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "The video shows a traffic light that changes from red to green and then back to red again. The video also includes a piece of information that says the traffic light changes from red to yellow. However, this information is not consistent with the video.", "gt-answer": "A. From red to green", "rating": 1 }, { "chatgpt-reasoning": "In the video description, it is mentioned that the traffic light changes \"from red to green, and then back to red again.\" This indicates that the change happening to the traffic lights is from red to green.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "The video showcases a traffic light that changes from red to green, and then back to red again. The camera captures the light from different angles, highlighting its color and movement. The video emphasizes the importance of traffic lights in maintaining order and safety on the roads.", "gt-answer": "A. From red to green", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the traffic light turns \"from red to green.\" This indicates a change from one color to another.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "A traffic light turns from red to green.", "gt-answer": "A. From red to green", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the traffic light changes from red to green.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "A traffic light is shown in the video, and it changes from red to green.", "gt-answer": "A. From red to green", "rating": 1 } ] }, "1096612823": { "action": [ { "chatgpt-reasoning": "The video description mentions that the car is seen sliding on ice, dancing on the rooftop, and driving on the road.", "chatgpt-answer": "A. sliding on ice", "video-llm-prediction": "The video shows a car driving on a winding road surrounded by trees. The car is seen sliding on ice, dancing on the rooftop, and driving on the road. The video captures the beauty of nature and the thrill of driving on a winding road.", "gt-answer": "D. driving on the road", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the car is seen sliding on ice, dancing on the rooftop, and driving on the road. This implies that the car's movement includes these actions.", "chatgpt-answer": "A. sliding on ice, B. dancing on the rooftop, D. driving on the road", "video-llm-prediction": "A car is seen sliding on ice, dancing on the rooftop, and driving on the road.", "gt-answer": "D. driving on the road", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions multiple scenarios involving different movements of the car. However, it does not provide specific information about the car's movement in any particular scene, such as sliding on ice, dancing on the rooftop, being buried in the sand, or driving on the road. Therefore, it is not possible to determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A car slides on ice, a car dances on the rooftop, a car is buried in the sand, and a car drives on the road.", "gt-answer": "D. driving on the road", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions multiple actions related to the car's movement, including sliding on ice, dancing on the rooftop, being buried in the sand, and driving on the road.", "chatgpt-answer": "A. sliding on ice, B. dancing on the rooftop, C. buried in the sand, D. driving on the road", "video-llm-prediction": "A car slides on ice, a car dances on the rooftop, a car is buried in the sand, and a car drives on the road.", "gt-answer": "D. driving on the road", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera captures the road from different angles, including a bird's eye view. This indicates that the camera is moving or changing its perspective. The final sentence also suggests that the video ends with a panoramic view of the surrounding landscape, which implies that the camera is zooming out to capture the larger view.", "chatgpt-answer": "A. zooming out", "video-llm-prediction": "The video showcases a winding road surrounded by trees and mountains. The camera captures the road from different angles, including a bird's eye view. The video also features a car driving down the road, and a person standing on the side of the road. The video ends with a panoramic view of the surrounding landscape.", "gt-answer": "D. zooming in", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the road and the car from different angles, including a bird's eye view from above. This suggests that the camera is moving to capture different perspectives, rather than zooming in or out, rotating, or panning left.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a winding road surrounded by trees and mountains. The camera captures the road from different angles, including a bird's eye view from above. The video also features a car driving down the road, and the camera captures the car from different angles. The video ends with a panoramic view of the surrounding landscape.", "gt-answer": "D. zooming in", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the road from different angles, including a bird's eye view. This indicates that the camera is moving or changing its perspective. Since none of the choices involve changing the camera angle, none of the choices are correct.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a winding road surrounded by trees and mountains. The camera captures the road from different angles, including a bird's eye view. The video also includes a shot of a car driving down the road.", "gt-answer": "D. zooming in", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the road from different angles, including a bird's eye view. This implies that the camera is moving to different positions to capture the road. The video ends with a shot of the road from a distance, which suggests that the camera is moving away or zooming out.", "chatgpt-answer": "A. zooming out", "video-llm-prediction": "The video showcases a winding road surrounded by trees and mountains. The camera captures the road from different angles, including a bird's eye view. The video also features a car driving down the road, and a person standing on the side of the road. The video ends with a shot of the road from a distance.", "gt-answer": "D. zooming in", "rating": 0 } ] }, "1075484900": { "direction": [ { "chatgpt-reasoning": "The video description states that the baby is looking at the camera and then turns away from the man. This indicates that the baby is initially facing towards the man and then turns away from him.", "chatgpt-answer": "B. Towards the man", "video-llm-prediction": "A man and a woman are holding a baby in their arms and smiling. The baby is looking at the camera and then turns away from the man. The man then kisses the baby on the forehead.", "gt-answer": "C. Turning away from the man", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the baby is looking at the camera and then looking away, indicating that the baby is facing the camera. Since the woman is holding the baby in front of the man, it can be inferred that the baby is also facing towards the man.", "chatgpt-answer": "B. Towards the man", "video-llm-prediction": "A woman is holding a baby in her arms and smiling. The baby is looking at the camera and then looking away. The woman is holding the baby in front of a man who is also smiling. The baby is then held by the woman and the man. The baby is then held by the woman and the baby is looking at the camera. The baby is then held by the woman and the baby is looking away. The baby is then held by the woman and the baby is looking at the camera. The baby is then held by the woman and the baby is looking away. The baby is then held by the woman and the", "gt-answer": "C. Turning away from the man", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the child is being held by the man first, indicating that the child is facing towards the man.", "chatgpt-answer": "B. Towards the man", "video-llm-prediction": "A man holds a baby while a woman smiles and talks to the baby. The baby is then held by the woman and the man.", "gt-answer": "C. Turning away from the man", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the baby is looking at the camera and then looking at the man. It also states that the baby is turned towards the woman. Therefore, the child is turning away from the man.", "chatgpt-answer": "C. Turning away from the man", "video-llm-prediction": "A man and a woman are holding a baby in their arms and smiling. The baby is looking at the camera and then looking at the man. The baby is then turned towards the woman.", "gt-answer": "C. Turning away from the man", "rating": 1 } ] }, "1090578917": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that the man is playing soccer on a field while a crowd watches.", "chatgpt-answer": "A. playing soccer", "video-llm-prediction": "A man is seen playing soccer on a field while a crowd watches.", "gt-answer": "A. playing soccer", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man is playing soccer on a field while wearing a yellow shirt. He is also seen kneeling down on the field and looking at the camera. This indicates that the man is engaged in playing soccer.", "chatgpt-answer": "A. playing soccer", "video-llm-prediction": "A man is seen playing soccer on a field while wearing a yellow shirt. He is also seen kneeling down on the field and looking at the camera.", "gt-answer": "A. playing soccer", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the man is playing soccer on a field.", "chatgpt-answer": "A. playing soccer", "video-llm-prediction": "A man playing soccer on a field.", "gt-answer": "A. playing soccer", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the man is playing soccer on a field.", "chatgpt-answer": "A. playing soccer", "video-llm-prediction": "A man is seen playing soccer on a field while wearing a yellow shirt.", "gt-answer": "A. playing soccer", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description states that the man is seen kneeling on the ground and then leaping to his right. This implies that he is first kneeling, then he leaps. There is no mention of him standing up in the video description. Therefore, option C is the correct answer.", "chatgpt-answer": "C. The man is leaping to his right and then standing up", "video-llm-prediction": "A man in an orange shirt is seen kneeling on the ground and then leaping to his right. He is wearing black socks and gloves. The video shows a soccer game being played in a stadium with a large crowd watching. The man is seen making a goal and then kneeling down.", "gt-answer": "C. The man is leaping to his right and then standing up", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is first seen kneeling on the ground and then standing up. It also mentions that he then leaps to his right and stands up again. Therefore, the correct order of events in the video is C. The man is leaping to his right and then standing up.", "chatgpt-answer": "C. The man is leaping to his right and then standing up.", "video-llm-prediction": "The video shows a man in an orange shirt and black shorts who is seen kneeling on the ground and then standing up. He then leaps to his right and stands up again. The man is seen wearing a glove on his hand. The video takes place in a field with a large crowd watching the man. The man is seen walking away from the field after the game.", "gt-answer": "C. The man is leaping to his right and then standing up", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is seen kneeling on the ground, then standing up, then leaping to his right, and finally standing up again. Option B (\"The man is standing up and then leaping to his right\") correctly matches this order of events.", "chatgpt-answer": "B. The man is standing up and then leaping to his right", "video-llm-prediction": "A man in an orange shirt is seen kneeling on the ground and then standing up. He then leaps to his right and stands up again.", "gt-answer": "C. The man is leaping to his right and then standing up", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is first seen kneeling on the ground and then leaping to his right. From this information, we can determine that the correct order of events is that the man is leaping to his right first and then standing up.", "chatgpt-answer": "C. The man is leaping to his right and then standing up", "video-llm-prediction": "The man is seen kneeling on the ground and then leaping to his right. He is wearing a yellow shirt and black shorts.", "gt-answer": "C. The man is leaping to his right and then standing up", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that the man is leaping to his left in front of a net, then he leaps backward and forward again. This indicates that the man is leaping in multiple directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen leaping to his left in front of a net. He then leaps backward and forward again.", "gt-answer": "D. to his right", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen leaping to his left, then backward, and finally forward.", "chatgpt-answer": "A. to his left", "video-llm-prediction": "A man in an orange shirt is seen leaping to his left, then backward, and finally forward. He is wearing black socks and gloves. The video shows him playing soccer on a field with a crowd watching.", "gt-answer": "D. to his right", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is leaping to his left and then backward.", "chatgpt-answer": "B. backward", "video-llm-prediction": "A man in an orange shirt leaps to his left and then backward.", "gt-answer": "D. to his right", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is leaping to his left and then backward.", "chatgpt-answer": "A. to his left", "video-llm-prediction": "A man in an orange shirt leaps to his left and then backward, all while wearing black socks.", "gt-answer": "D. to his right", "rating": 0 } ] }, "1075338140": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the ball is rolling from left to right and then rolls back to the left. It also mentions that the video showcases the ball's movement in different directions. Therefore, the correct answer is that the ball is rolling from left to right and right to left.", "chatgpt-answer": "D. rolling from right to left", "video-llm-prediction": "A silver ball is seen rolling from left to right on a pink surface. The ball then rolls back to the left and continues to roll forward again. The video showcases the ball's movement in different directions, including forward and backward, spinning in place, and rolling from left to right and right to left.", "gt-answer": "C. rolling from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the ball is seen rolling from left to right on a pink surface and then rolls back from right to left. This indicates that the direction of the ball changes from left to right to right to left.", "chatgpt-answer": "D. rolling from right to left", "video-llm-prediction": "A silver ball is seen rolling from left to right on a pink surface. The ball then rolls back from right to left.", "gt-answer": "C. rolling from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the ball rolls from left to right on a pink surface.", "chatgpt-answer": "C. rolling from left to right", "video-llm-prediction": "A ball rolls from left to right on a pink surface.", "gt-answer": "C. rolling from left to right", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the silver ball is rolling from left to right on a pink surface.", "chatgpt-answer": "C. rolling from left to right", "video-llm-prediction": "A silver ball is seen rolling from left to right on a pink surface.", "gt-answer": "C. rolling from left to right", "rating": 1 } ] }, "1067268403": { "direction": [ { "chatgpt-reasoning": "The video description specifically mentions that the wind turbines are stationary at first, then they start rotating in a clockwise direction and later in a counterclockwise direction.", "chatgpt-answer": "C. Rotating counterclockwise", "video-llm-prediction": "The video showcases a serene view of wind turbines situated in the ocean. The camera pans around the area, capturing the beauty of the landscape. The wind turbines are stationary, and the camera captures their position in the ocean. The video then transitions to show the wind turbines rotating in a clockwise direction, creating a mesmerizing view. The camera captures the movement of the wind turbines, highlighting their beauty. The video then shows the wind turbines rotating in a counterclockwise direction, creating a stunning visual effect. The camera captures", "gt-answer": "B. Rotating clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the wind turbines from different angles, highlighting their beauty and power. This suggests that the wind turbines are in motion.", "chatgpt-answer": "B. Rotating clockwise", "video-llm-prediction": "The video showcases a serene view of wind turbines situated near the ocean. The camera captures the wind turbines from different angles, highlighting their beauty and power. The sun sets in the background, casting a warm glow on the scene. The sound of the waves crashing against the shore can be heard in the background, adding to the calming atmosphere. The video ends with a shot of the sun setting, leaving the viewer with a sense of peace and tranquility.", "gt-answer": "B. Rotating clockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the wind turbines are stationary in the water. Therefore, they are not rotating in any direction.", "chatgpt-answer": "A. Stationary", "video-llm-prediction": "The video shows wind turbines stationary in the water.", "gt-answer": "B. Rotating clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the wind turbines are displayed in different positions, including stationary and rotating clockwise and counterclockwise.", "chatgpt-answer": "B. Rotating clockwise and C. Rotating counterclockwise", "video-llm-prediction": "A video showcases wind turbines in a serene environment. The video displays the turbines in different positions, including stationary and rotating clockwise and counterclockwise. The video highlights the beauty of the environment and the efficiency of the turbines.", "gt-answer": "B. Rotating clockwise", "rating": 0 } ] }, "1072594556": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the car is seen driving at different speeds, including slower than other cars and at the same speed as other cars. Since the question asks for the speed of the car in the center of the screen, we can infer that it is one of the cars mentioned in the video description. Therefore, the correct answer is option C - at the same speed as other cars.", "chatgpt-answer": "C. at the same speed as other cars", "video-llm-prediction": "The video shows a car driving down a busy city street with other cars around it. The car is seen driving at different speeds, including slower than other cars and at the same speed as other cars. The video also shows the car driving down the street at night.", "gt-answer": "B. faster than other cars", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the car in the center of the screen is seen driving at a slower pace than the other cars.", "chatgpt-answer": "A. slower than other cars", "video-llm-prediction": "The video showcases a car driving down a busy city street, surrounded by other cars. The car in the center of the screen is seen driving at a slower pace than the other cars. The video captures the bustling city life, with the car driving past tall buildings and palm trees. The car's movement is smooth and steady, and the camera angle captures the car's every movement. The video provides a glimpse into the daily life of a city, with the car driving through the busy streets, and the other cars driving at the same speed.", "gt-answer": "B. faster than other cars", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the car in the center of the screen is driving slower than the other cars.", "chatgpt-answer": "A. slower than other cars", "video-llm-prediction": "The video shows a car driving on a city street with other cars. The car in the center of the screen is driving slower than the other cars.", "gt-answer": "B. faster than other cars", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the car is driving down a busy city street, passing by other cars and pedestrians. It does not provide any specific information about the speed of the car or how it compares to other cars. Therefore, we cannot determine the speed of the car based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a car driving down a busy city street, passing by other cars and pedestrians.", "gt-answer": "B. faster than other cars", "rating": 0 } ] }, "1096007487": { "direction": [ { "chatgpt-reasoning": "Based on the video description, the circle is shown moving upward, downward, leftward, and rightward. However, the question specifically asks for the direction of the 3D cloud, not the circle. Since no information is given about the movement of the 3D cloud, it is not possible to determine its direction.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a circle with a pink background and a white outline of a circle. The circle is surrounded by a pink and blue gradient. The video also shows a pink and blue gradient with a white circle in the middle. The circle is shown moving upward, downward, leftward, and rightward. The video ends with a pink and blue gradient with a white circle in the middle.", "gt-answer": "C. leftward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the cloud is shown moving upward, downward, leftward, and rightward. This means that the cloud is moving in multiple directions, so none of the choices are correct.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a circle with a pink outline and a blue background, which is surrounded by a pink and blue cloud. The cloud is shown moving upward, downward, leftward, and rightward.", "gt-answer": "C. leftward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the cloud is moving upward.", "chatgpt-answer": "A. upward", "video-llm-prediction": "A cloud is shown moving upward in the video.", "gt-answer": "C. leftward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the cloud is shown moving upward. This indicates that the cloud is moving in the upward direction from the camera's point of view.", "chatgpt-answer": "A. upward", "video-llm-prediction": "A cloud is shown moving upward in the video.", "gt-answer": "C. leftward", "rating": 0 } ] }, "1095939659": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the light starts at the center and moves outwards in a circular motion. This implies that the light is growing in the outward direction.", "chatgpt-answer": "D. Upwards", "video-llm-prediction": "The video showcases a light that starts at the center and moves outwards in a circular motion. The light starts at the center and moves outwards in a circular motion.", "gt-answer": "B. Clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the light starts at the center and gradually moves outwards. This indicates that the light is growing or expanding in a specific direction.", "chatgpt-answer": "D. Upwards", "video-llm-prediction": "The video showcases a light that starts at the center and gradually moves outwards, creating a mesmerizing visual effect. The light's movement is accompanied by a captivating sound that adds to the overall experience. The video's purpose is to showcase the light's movement and the sound's harmony, creating a visually and aurally pleasing experience.", "gt-answer": "B. Clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the light is growing downwards.", "chatgpt-answer": "A. Downwards", "video-llm-prediction": "A light is shown growing downwards.", "gt-answer": "B. Clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the light is growing downwards.", "chatgpt-answer": "A. Downwards", "video-llm-prediction": "A light is shown growing downwards in the video.", "gt-answer": "B. Clockwise", "rating": 0 } ] }, "1059632327": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the tennis ball is bouncing up and down, spinning clockwise and anticlockwise, rolling forward and backward, and bouncing left to right on the court.", "chatgpt-answer": "All of the choices are correct.", "video-llm-prediction": "A tennis ball is seen bouncing up and down on a tennis court. The ball is then shown spinning clockwise and anticlockwise. The ball is then seen rolling forward and backward on the court. Finally, the ball is shown bouncing left to right on the court.", "gt-answer": "A. bouncing up and down", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the tennis ball is seen bouncing up and down, spinning clockwise and anticlockwise, and rolling forward and backward on the court. None of the choices mention all these movements correctly.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A tennis ball is seen bouncing up and down on a court. The ball is then shown spinning clockwise and anticlockwise, and rolling forward and backward. The video showcases the movement of the tennis ball on the court.", "gt-answer": "A. bouncing up and down", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the tennis ball is bouncing up and down on a tennis court.", "chatgpt-answer": "A. bouncing up and down", "video-llm-prediction": "A tennis ball is seen bouncing up and down on a tennis court.", "gt-answer": "A. bouncing up and down", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the tennis ball is bouncing up and down on a court. This indicates that the direction of the tennis ball is vertical, moving up and down.", "chatgpt-answer": "A. bouncing up and down", "video-llm-prediction": "A tennis ball is seen bouncing up and down on a court.", "gt-answer": "A. bouncing up and down", "rating": 1 } ] }, "1098785169": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the galaxy's rotation is showcased from various angles, including spinning counterclockwise, left to right, clockwise, and up and down. This suggests that the galaxy's spin can occur in any of these directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a beautiful and mesmerizing view of a galaxy spinning in the vastness of space. The camera captures the galaxy's rotation from various angles, highlighting its intricate structure and the vastness of the universe. The video provides a unique perspective of the galaxy's movement, with different directions of rotation, such as spinning counterclockwise, left to right, clockwise, and up and down. The video aims to inspire awe and wonder in the viewer, as they witness the beauty and complexity of the galaxy's rotation.", "gt-answer": "C. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the galaxy is spinning in different directions. However, it does not specifically mention whether the spin is clockwise or counterclockwise.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a beautiful and mesmerizing view of a galaxy spinning in the vastness of space. The camera captures the galaxy's movement, spinning in different directions, and the colors of the galaxy are vibrant and stunning. The video provides a sense of wonder and awe, as the camera pans around the galaxy, showcasing its intricate and complex structure. The video is a visual treat for anyone who loves astronomy and space exploration.", "gt-answer": "C. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the galaxy is spinning counterclockwise.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "A galaxy is shown spinning counterclockwise.", "gt-answer": "C. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the galaxy is spinning counterclockwise.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "A galaxy is shown spinning counterclockwise, with a bright light in the middle.", "gt-answer": "C. clockwise", "rating": 0 } ] }, "1099984801": { "direction": [ { "chatgpt-reasoning": "The video description mentions a time-lapse of the sky showcasing the movement of the clouds. However, the actual video content does not provide any information about the movement of the clouds.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range at night, with the stars twinkling above. The camera pans across the sky, capturing the beauty of the stars and the mountain range. The video also features a time-lapse of the sky, showcasing the movement of the clouds. The information provided is not consistent with the video content.", "gt-answer": "C. moving towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the clouds in the sky move in different directions, but it does not specify if they are moving away from the camera or towards the camera. Therefore, there is not enough information to determine the movement of the clouds.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with a clear blue sky. The camera pans around the mountain range, capturing the beauty of the snow-covered peaks and the vastness of the landscape. The clouds in the sky move in different directions, adding to the dynamic nature of the scene. The video is a perfect representation of the serene beauty of nature and the power of the mountains.", "gt-answer": "C. moving towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the clouds are moving away from the camera.", "chatgpt-answer": "A. moving away from the camera", "video-llm-prediction": "The video shows a beautiful view of the night sky with stars and a moon. The camera pans around the sky, and the clouds move away from the camera.", "gt-answer": "C. moving towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about clouds. It only mentions a beautiful night sky with a mountain range in the background, and that the camera pans around the sky capturing the stars and the mountain range. Since there is no information about the movement of the clouds, we cannot determine the correct answer from the given choices.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a beautiful night sky with a mountain range in the background. The camera pans around the sky, capturing the stars and the mountain range. The video ends with a shot of the mountain range.", "gt-answer": "C. moving towards the camera", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video includes a time-lapse effect, which allows the viewer to see the movement of the stars and the changing positions of the mountain range over time.", "chatgpt-answer": "C. time-lapse", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range at night, with the stars twinkling in the sky above. The camera pans around the mountain range, capturing the beauty of the snow-covered peaks and the vastness of the mountain range. The video also includes a time-lapse effect, which allows the viewer to see the movement of the stars and the changing positions of the mountain range over time. The video is a perfect representation of the beauty of nature and the awe-inspiring view of the mountain range at night.", "gt-answer": "C. time-lapse", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the entire video is shot in slow motion, which means that the speed of the video is slowed down.", "chatgpt-answer": "B. slow motion", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range at night, with the stars twinkling above. The camera captures the serene beauty of the landscape, with the snow-covered mountains and the starry sky providing a sense of tranquility. The video also features a time-lapse effect, which allows the viewer to witness the changing colors of the sky as the night progresses. The entire video is shot in slow motion, which allows the viewer to appreciate the details of the landscape. Overall, the video is a captivating display of the natural beauty of the world", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, there is no specific indication of the speed of the video. The description only mentions the visual elements such as the night sky, stars, moon, and snow-covered peaks.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a beautiful night sky with stars and a moon, and a mountain range with snow-covered peaks.", "gt-answer": "C. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there is a time-lapse of the stars moving across the sky, which suggests that the video is in time-lapse speed.", "chatgpt-answer": "C. time-lapse", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range at night, with the stars twinkling above. The camera pans over the mountains, capturing their majestic beauty. The video also features a time-lapse of the stars moving across the sky, adding to the overall awe-inspiring experience.", "gt-answer": "C. time-lapse", "rating": 1 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the sky is dark, indicating that the video is not getting brighter. It also does not mention any changes in the lighting conditions or any other elements that would suggest the video is getting darker. Therefore, the most reasonable answer is that the video is staying the same.", "chatgpt-answer": "A. staying the same", "video-llm-prediction": "The video showcases a breathtaking view of the night sky with a mountain range in the background. The sky is dark, and the stars are shining brightly, creating a serene and peaceful atmosphere. The camera pans around the sky, capturing the beauty of the stars and the vastness of the mountain range. The video ends with the camera focusing on the mountain range, leaving the viewer with a sense of awe and wonder.", "gt-answer": "B. getting darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video starts at night with stars twinkling above, and then ends with a shot of the mountain range at daybreak with the sun rising. This indicates a transition from darkness to brightness.", "chatgpt-answer": "C. getting brighter", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range at night, with the stars twinkling above. The camera pans around the mountain range, capturing the beauty of the snow-covered peaks and the vastness of the night sky. The video ends with a shot of the mountain range at daybreak, with the sun rising over the mountains and casting a warm glow over the snow.", "gt-answer": "B. getting darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sky gradually gets darker and brighter, indicating a change in brightness.", "chatgpt-answer": "C. getting brighter", "video-llm-prediction": "The video shows a beautiful night sky with stars and a moon. The sky gradually gets darker and brighter, and the stars twinkle in the dark.", "gt-answer": "B. getting darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the serene beauty of the landscape, with the snow-covered mountains and the starry sky providing a sense of tranquility and wonder. This implies that the scene is static and there is no change in brightness.", "chatgpt-answer": "A. staying the same", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range at night, with the stars twinkling in the sky above. The camera captures the serene beauty of the landscape, with the snow-covered mountains and the starry sky providing a sense of tranquility and wonder. The video is a perfect representation of the beauty of nature and the awe-inspiring view of the mountains at night.", "gt-answer": "B. getting darker", "rating": 0 } ] }, "1082419672": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the cruise ship is \"moving through the water\" and the camera is \"following its movement\". This indicates that the cruise ship is moving in a particular direction.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "The video showcases a large cruise ship sailing on the ocean. The camera captures the ship from different angles, highlighting its size and grandeur. The ship is seen moving through the water, with the camera following its movement. The video also includes a shot of the ship from above, showcasing its impressive structure. Overall, the video provides a stunning view of the cruise ship and its surroundings.", "gt-answer": "C. flying backwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the large cruise ship is seen sailing on the water, which indicates a forward movement.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "A large cruise ship is seen sailing on the water, with people on the deck enjoying the view. The ship is surrounded by a beautiful blue ocean, and the sky is clear and blue. The camera pans around the ship, showing the different areas of the deck, including the pool and the restaurants. The people on the ship are seen enjoying the sun and the sea breeze. The ship continues to sail on the water, with the sound of the waves and the wind in the background.", "gt-answer": "C. flying backwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a large cruise ship is \"sailing\" on the water. Sailing typically refers to the act of moving forward on water with the help of wind or engine power. None of the choices mention sailing specifically, but \"flying forwards\" seems to best capture the idea of movement in a forward direction.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "A large cruise ship is seen sailing on the water.", "gt-answer": "C. flying backwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the large cruise ship is seen sailing on the water and appears to be moving at a steady pace. There is no mention of hovering or flying, so the correct answer is the option that indicates movement on the water.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "A large cruise ship is seen sailing on the water, with a lighthouse visible in the background. The ship is surrounded by a vast blue ocean, and the sky is clear and blue. The camera captures the ship from different angles, showcasing its impressive size and design. The ship's sails are down, and it appears to be moving at a steady pace. The water is calm, and there are no visible waves or rough conditions. The lighthouse in the background adds to the serene and peaceful atmosphere of the scene. Overall, the video provides a beautiful and calming view", "gt-answer": "C. flying backwards", "rating": 0 } ] }, "1058985719": { "direction": [ { "chatgpt-reasoning": "The video description explicitly states that the airplane is flying from the bottom to the top of the sky.", "chatgpt-answer": "A. bottom to top", "video-llm-prediction": "A large airplane is seen flying from the bottom to the top of the sky, with the sun shining brightly in the background. The airplane is flying high in the sky, and the sun is shining brightly, creating a beautiful view. The sky is filled with clouds, and the sun is shining brightly, creating a beautiful view. The airplane is flying high in the sky, and the sun is shining brightly, creating a beautiful view. The sky is filled with clouds, and the sun is shining brightly, creating a beautiful view.", "gt-answer": "A. bottom to top", "rating": 1 }, { "chatgpt-reasoning": "The description mentions that the video showcases the airplane from different angles, including from below and above. This indicates that the airplane is flying in a vertical direction.", "chatgpt-answer": "C. top to bottom", "video-llm-prediction": "The video showcases a large airplane flying through the sky, with the sun shining through the clouds. The airplane is seen from different angles, including from below and above. The video captures the beauty of the sky and the airplane's journey through it.", "gt-answer": "A. bottom to top", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the plane is flying from bottom to top.", "chatgpt-answer": "A. bottom to top", "video-llm-prediction": "A plane is seen flying from bottom to top in the video.", "gt-answer": "A. bottom to top", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the plane is flying from bottom to top.", "chatgpt-answer": "A. bottom to top", "video-llm-prediction": "A plane is seen flying from bottom to top in the video.", "gt-answer": "A. bottom to top", "rating": 1 } ] }, "1055413730": { "direction": [ { "chatgpt-reasoning": "The video description explicitly mentions that the planet Earth is spinning rightwards, which is consistent with the information provided in the video.", "chatgpt-answer": "A. Rightwards", "video-llm-prediction": "The video shows a spinning globe of the Earth, with the words \"Earth\" and \"Spinning\" appearing on the screen. The video also includes a piece of information that says \"Spinning Rightwards,\" which is consistent with the video.", "gt-answer": "A. Rightwards", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions the directions in which the globe is spinning, with the text appearing on the screen. The video shows the globe spinning rightwards, then downwards, then leftwards, and finally upwards. Since the question asks about the direction in which the planet Earth is spinning, we can conclude that the correct answer is the opposite of the direction shown in the video. Therefore, the planet Earth is spinning.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a spinning globe, with the text \"Spinning Rightwards\" appearing on the screen. The globe is then shown spinning in the opposite direction, with the text \"Spinning Downwards\" appearing on the screen. The video then shows the globe spinning in the opposite direction once again, with the text \"Spinning Leftwards\" appearing on the screen. Finally, the video shows the globe spinning in the opposite direction one last time, with the text \"Spinning Upwards\" appearing on the screen.", "gt-answer": "A. Rightwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the planet Earth is spinning in a rightward direction.", "chatgpt-answer": "A. Rightwards", "video-llm-prediction": "A video of a spinning globe is presented, and the video shows the spinning of the globe in a rightward direction.", "gt-answer": "A. Rightwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the globe is spinning. Since there is no specific mention of the direction, we cannot determine the exact direction of the Earth's rotation based on the information provided in the video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a spinning globe, with the text \"A Spinning Globe\" appearing on the screen.", "gt-answer": "A. Rightwards", "rating": 0 } ] }, "1081684532": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the asteroids are flying away from the camera.", "chatgpt-answer": "A. flying away from the camera", "video-llm-prediction": "The video showcases a group of asteroids flying away from the camera, with some of them flying towards the camera. The video provides a mesmerizing view of the asteroids as they move in different directions. The consistent information with the video is that the asteroids are flying away from the camera. The other information is not consistent with the video.", "gt-answer": "C. flying towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the group of asteroids is \"flying away from the camera.\"", "chatgpt-answer": "A. flying away from the camera", "video-llm-prediction": "The video showcases a group of asteroids flying away from the camera, with each asteroid moving in a different direction. The camera captures the movement of the asteroids from different angles, providing a dynamic and engaging visual experience. The video highlights the beauty and complexity of the asteroid belt, as well as the vastness of space.", "gt-answer": "C. flying towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the asteroids are shown flying away from the camera.", "chatgpt-answer": "A. flying away from the camera", "video-llm-prediction": "A video of an asteroid field with a blue background and a black sky. The asteroids are shown flying away from the camera.", "gt-answer": "C. flying towards the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the asteroids are moving in different directions, specifically some flying away from the camera and others flying towards it. This means that the direction of the asteroids can be described as flying away from the camera or flying towards the camera.", "chatgpt-answer": "A. flying away from the camera or C. flying towards the camera", "video-llm-prediction": "A video showcases the movement of asteroids in different directions, with some flying away from the camera and others flying towards it.", "gt-answer": "C. flying towards the camera", "rating": 0 } ] }, "23391142": { "action": [ { "chatgpt-reasoning": "The video description mentions that a group of people is playing badminton in a gym, hitting the shuttlecock back and forth over the net. This indicates that the people in the video are playing badminton.", "chatgpt-answer": "B. playing badminton", "video-llm-prediction": "The video shows a group of people playing badminton in a gym. The players are seen hitting the shuttlecock back and forth over the net. The players are wearing different colored shirts, and the gym has a wooden floor. The video also shows a man in a red shirt walking in front of the players. The video ends with the players walking away from the camera.", "gt-answer": "B. playing badminton", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the people are playing badminton in a gymnasium, hitting the shuttlecock back and forth over the net.", "chatgpt-answer": "B. playing badminton", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The players are dressed in athletic clothing and seem to be enjoying the game. The gymnasium is well-lit and has a wooden floor. The players are hitting the shuttlecock with their rackets and the shuttlecock is seen flying through the air. The players are moving around the court, trying to keep the shuttlecock in play. The game continues for a while until the players take a break and walk around the court. Over", "gt-answer": "B. playing badminton", "rating": 1 }, { "chatgpt-reasoning": "The video description states clearly that a group of people are playing badminton in a gym.", "chatgpt-answer": "B. playing badminton", "video-llm-prediction": "A group of people are playing badminton in a gym.", "gt-answer": "B. playing badminton", "rating": 1 }, { "chatgpt-reasoning": "The video description states that a group of people are playing badminton in a gymnasium.", "chatgpt-answer": "B. playing badminton", "video-llm-prediction": "A group of people are playing badminton in a gymnasium.", "gt-answer": "B. playing badminton", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description does not mention anything about the camera panning in any particular direction. Therefore, we cannot determine the direction of the video panning based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The video also shows a man in a red shirt walking around the court while the game is being played. The video ends with the players walking away from the court.", "gt-answer": "D. To the right", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the direction in which the video is panning. There is no information provided to determine the correct answer.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The game continues with the players hitting the shuttlecock with their rackets. The players seem to be enjoying the game as they continue to play. The gymnasium is well-lit, and the walls are painted in a light blue color. The players are wearing athletic clothing, and the shuttlecock is white in color. The game continues for some time, and the players seem to be evenly matched. Overall, the video capt", "gt-answer": "D. To the right", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the panning direction. Therefore, we cannot determine the panning direction based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A man in a red shirt is playing tennis with a woman in a pink shirt. They are hitting the ball back and forth over the net.", "gt-answer": "D. To the right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video captures the players' movements as they move around the court, trying to outmaneuver their opponents. This implies that the camera is following the players' movements, panning from one side of the court to another.", "chatgpt-answer": "D. To the right", "video-llm-prediction": "The video shows a group of people playing badminton in a gym. The players are seen hitting the shuttlecock back and forth over the net. The video captures the players' movements as they move around the court, trying to outmaneuver their opponents. The players' skills are evident as they hit the shuttlecock with precision and speed. The gym provides a spacious area for the players to move around freely. The video captures the excitement and energy of the game, making it an enjoyable watch for anyone interested in badminton.", "gt-answer": "D. To the right", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is shot in a fast-motion style.", "chatgpt-answer": "C. time-lapse", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The video also shows a man in a red shirt and black shorts walking around the court. The players are wearing different colored shirts, and the gymnasium has a wooden floor. The video is shot in a fast-motion style, and the players are seen hitting the shuttlecock with their rackets. The video ends with the players walking around the court.", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, there is no mention of the speed of the video. The description only provides details about the environment, the players' actions, their clothing, and the appearance of the shuttlecock. Since there is no information regarding the speed of the video, it is not possible to determine whether it is in normal speed, slow motion, or time-lapse.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The game continues with the players hitting the shuttlecock with their rackets. The players seem to be enjoying the game as they continue to play. The gymnasium is well-lit, and the walls are painted in a light blue color. The players are wearing athletic clothing, and the shuttlecock is white in color. The video captures the players' movements as they move around the court, hitting the shuttlecock with their", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. However, based on the description that the video captures the players' movements and the sound of the shuttlecock hitting the rackets, it is likely that the video is in normal speed to accurately show the players playing badminton.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The video captures the players' movements and the sound of the shuttlecock hitting the rackets.", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any changes in the speed of the video, so it can be assumed that the video is in normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video shows a group of people playing badminton in a gym. The players are seen hitting the shuttlecock back and forth over the net. The video captures the players' movements as they run around the court, trying to keep up with the shuttlecock. The players seem to be having a good time, and the gym provides a spacious area for them to play. The video is shot in a well-lit area, and the sound of the shuttlecock hitting the rackets can be heard throughout the video. Overall, the video showcases a fun and active game of", "gt-answer": "B. slow motion", "rating": 0 } ] }, "1078368947": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the woman is sitting in a bathtub, reading a book. It also mentions that the woman appears to be enjoying her time in the tub and that the sound of water can be heard in the background. All these details indicate that the woman is taking a bath and reading a book at the same time.", "chatgpt-answer": "C. reading a book while taking a bath", "video-llm-prediction": "A woman is seen sitting in a bathtub, reading a book. She appears to be enjoying her time in the tub, and the sound of the water can be heard in the background. The woman seems to be relaxed and at ease, and the book she is reading appears to be a romance novel. The lighting in the room is dim, and the woman's hair is wet from the water. The bathtub is large and spacious, and the woman is sitting comfortably in it. Overall, the video captures a peaceful and serene moment of a woman enjoying a relax", "gt-answer": "C. reading a book while taking a bath", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is taking a bath and reading a book. She is also washing her face while in the bath.", "chatgpt-answer": "C. reading a book while taking a bath", "video-llm-prediction": "A woman is seen taking a bath while reading a book. She is also seen washing her face while in the bath.", "gt-answer": "C. reading a book while taking a bath", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the woman is taking a bath while reading a book. This indicates that she is engaged in both activities simultaneously.", "chatgpt-answer": "C. reading a book while taking a bath", "video-llm-prediction": "A woman is seen taking a bath while reading a book.", "gt-answer": "C. reading a book while taking a bath", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically mentions that the woman is taking a bath while reading a book. It also mentions that she is washing her face while in the tub. Based on this information, the correct answer is C. reading a book while taking a bath.", "chatgpt-answer": "C. reading a book while taking a bath", "video-llm-prediction": "A woman is seen taking a bath while reading a book. She is also seen washing her face while in the tub.", "gt-answer": "C. reading a book while taking a bath", "rating": 1 } ] }, "1099738787": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the concrete wall is melting, falling apart, and growing taller. However, none of the choice candidates accurately represent all three actions happening to the wall. The wall is not fully melting or falling apart, nor is it simply growing taller. Therefore, none of the choices accurately describe what is happening to the wall.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a concrete wall that is melting, falling apart, and growing taller. The information that is consistent with the video is that the wall is made of concrete.", "gt-answer": "B. falling apart", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the concrete wall is both melting and falling apart. Although the video does not mention anything about the wall growing taller, it explicitly mentions that the wall eventually collapses, which suggests that it is not growing taller.", "chatgpt-answer": "B. falling apart", "video-llm-prediction": "The video showcases a concrete wall that is melting and falling apart, but it also grows taller. The video highlights the process of the wall's deterioration and the eventual collapse of the structure.", "gt-answer": "B. falling apart", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the concrete wall is melting and falling apart.", "chatgpt-answer": "A. melting", "video-llm-prediction": "A concrete wall is shown melting and falling apart.", "gt-answer": "B. falling apart", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the concrete wall is melting, falling apart, and growing taller.", "chatgpt-answer": "A. melting, B. falling apart, C. growing taller", "video-llm-prediction": "A concrete wall is shown melting, falling apart, and growing taller.", "gt-answer": "B. falling apart", "rating": 0 } ] }, "1094219575": { "speed": [ { "chatgpt-reasoning": "From the video description, there are no indications that the video is playing at a different speed than normal. The description only mentions different shots and angles of the flower, which suggests a regular pace.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a white flower in various stages of bloom, from bud to full bloom. The camera captures the flower from different angles, highlighting its beauty and grace. The video starts with a close-up of the flower, and then transitions to a wider shot, showcasing the flower in its natural environment. The camera then zooms out, providing a broader perspective of the flower and its surroundings. Throughout the video, the flower is shown in different positions, from standing upright to swaying in the wind. The video ends with a close-up shot of the flower", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video is shot in a time-lapse manner and in a slow motion manner.", "chatgpt-answer": "B. time-lapse", "video-llm-prediction": "The video showcases a beautiful white flower with a pink center, which is the main subject. The video starts with a close-up shot of the flower, and then it pans out to show the entire flower. The camera then zooms in on the flower, and the video ends with a close-up shot of the flower. The video is shot in a black background, and the flower is the only object in the frame. The video is shot in a time-lapse manner, and the flower is shown in different stages of bloom. The video is shot in a slow motion manner, and the flower is shown in", "gt-answer": "B. time-lapse", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a flower is blooming. Blooming is a slow process that usually takes time, so it is likely that the video is in time-lapse mode, showing the process at an accelerated speed.", "chatgpt-answer": "B. time-lapse", "video-llm-prediction": "A video of a flower blooming is shown.", "gt-answer": "B. time-lapse", "rating": 1 }, { "chatgpt-reasoning": "Based on the description of the video, it mentions that the video starts with a close-up of the flower, then pans out to show the entire flower, zooms in on the flower again, and pans out to show the entire flower once more. This description suggests that the video is showing normal speed transitions between these shots.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "A video showcasing a white flower in a black background. The video starts with a close-up of the flower, and then it pans out to show the entire flower. The video then zooms in on the flower again, and the camera pans out to show the entire flower once more. The video ends with a close-up of the flower.", "gt-answer": "B. time-lapse", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the flower is shown in various stages of blooming, including its initial stages, full bloom, and wilted state. This indicates that the flowers are going through a process of blooming and then wilting.", "chatgpt-answer": "C. blooming, D. wilting", "video-llm-prediction": "The video showcases a beautiful white flower that is initially shown in a close-up shot. The camera then pans out to reveal the flower in a larger context. The flower is shown in various stages of blooming, including its initial stages, full bloom, and wilted state. The video highlights the beauty and delicacy of the flower, showcasing its intricate details and delicate petals. The video also emphasizes the flower's natural beauty, highlighting its vibrant colors and unique patterns. Overall, the video provides a captivating and visually stunning experience,", "gt-answer": "D. wilting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the flower goes through different stages, from growing taller and changing color to eventually wilting. Therefore, all of the choices are correct.", "chatgpt-answer": "A. growing taller, B. changing color, C. blooming, D. wilting", "video-llm-prediction": "The video showcases the process of a flower blooming, starting with a close-up shot of a single flower and then transitioning to a series of shots showing the flower growing taller and changing color. The video highlights the beauty and complexity of the flower's life cycle, from its initial stages of growth to its eventual bloom. The final shot of the video shows the flower wilting, emphasizing the fleeting nature of beauty and the inevitability of change.", "gt-answer": "D. wilting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the white flower blooms and wilts. Blooming refers to the process of a flower opening and blossoming, while wilting refers to the process of a flower losing its freshness and drooping. Therefore, the correct answer is D. wilting.", "chatgpt-answer": "D. wilting", "video-llm-prediction": "A white flower blooms and wilts in a black background.", "gt-answer": "D. wilting", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the flower is blooming and wilting. This means that the flower is going through a process where it opens up and then starts to wither.", "chatgpt-answer": "D. wilting", "video-llm-prediction": "A white flower blooms and wilts in a black background.", "gt-answer": "D. wilting", "rating": 1 } ] }, "1053758117": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the video starts with a zoom out from a 3D digital brain, then zooms in on the brain, and finally provides a detailed view of its various components.", "chatgpt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "The video starts with a zoom out from a 3D digital brain, which is the main subject of the video. The camera then zooms in on the brain, providing a closer look at its intricate structure. The video then shows a person standing still before a 3D digital brain, which could be interpreted as a representation of the brain's complexity. Finally, the video zooms in on the brain, providing a detailed view of its various components. Overall, the video showcases the beauty and complexity of the human brain.", "gt-answer": "C. Zoom into a 3D digital brain", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video begins with a zoomed-out view of the brain, then zooms in to provide a closer look at the intricate details of the brain, and finally zooms out again.", "chatgpt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "The video showcases a 3D digital brain that is zoomed in on and then zoomed out from. The video begins with a zoomed-out view of the brain, and then zooms in to provide a closer look at the intricate details of the brain. The video then zooms out again, providing a broader perspective of the brain. The video is a fascinating exploration of the human brain and its complexities.", "gt-answer": "C. Zoom into a 3D digital brain", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a 3D digital brain is shown in the video. There is no information given about zooming out or standing still, but it specifically states that the brain is being shown. This implies that there is an action happening related to the brain.", "chatgpt-answer": "C. Zoom into a 3D digital brain", "video-llm-prediction": "A 3D digital brain is shown in the video.", "gt-answer": "C. Zoom into a 3D digital brain", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically states that the video is showing a 3D digital brain zooming out from a close-up shot.", "chatgpt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "A 3D digital brain is shown in the video, zooming out from a close-up shot.", "gt-answer": "C. Zoom into a 3D digital brain", "rating": 0 } ] }, "1069717165": { "order": [ { "chatgpt-reasoning": "The video description states that the woman is seen nodding her head and shaking her head repeatedly. This indicates that she arranges her head movements by nodding and shaking her head repeatedly.", "chatgpt-answer": "A. nodding and shaking her head repeatedly", "video-llm-prediction": "A woman with blonde hair is seen in a white sweater. She is seen nodding her head and shaking her head repeatedly. The video seems to be a close-up shot of the woman's face. The woman's facial expressions are the main focus of the video. The video seems to be a simple yet effective way to showcase the woman's emotions. The video is shot in a way that makes the viewer feel like they are right there with the woman. Overall, the video is a simple yet effective way to showcase the woman's emotions.", "gt-answer": "B. shaking her head, followed by nodding her head", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is \"nodding and shaking her head repeatedly\".", "chatgpt-answer": "A. nodding and shaking her head repeatedly", "video-llm-prediction": "The video features a woman who is seen nodding and shaking her head repeatedly. She appears to be in a state of distress or discomfort. The woman's facial expressions and body language suggest that she is experiencing some form of emotional turmoil. The video captures the woman's emotional state in a raw and unfiltered way, allowing the viewer to witness her struggle firsthand. The woman's actions are the central focus of the video, and the camera captures her movements in detail, providing a close-up view of her emotional state. Overall, the video", "gt-answer": "B. shaking her head, followed by nodding her head", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is \"nodding and shaking her head repeatedly.\" This means that she is performing both actions simultaneously or in quick succession.", "chatgpt-answer": "A. nodding and shaking her head repeatedly", "video-llm-prediction": "A woman with blonde hair is seen nodding and shaking her head repeatedly.", "gt-answer": "B. shaking her head, followed by nodding her head", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is first seen smiling and nodding her head. Then, she shakes her head and nods her head repeatedly. Therefore, the correct arrangement of her head movements is shaking her head, followed by nodding her head.", "chatgpt-answer": "B. shaking her head, followed by nodding her head", "video-llm-prediction": "A woman with blonde hair is seen smiling and nodding her head. She then shakes her head and nods her head repeatedly.", "gt-answer": "B. shaking her head, followed by nodding her head", "rating": 1 } ] }, "1041584314": { "order": [ { "chatgpt-reasoning": "The video description states that the man starts by smiling, then shows a serious expression, and finally smiles again. None of the other options match this sequence.", "chatgpt-answer": "B. Smiling, then showing a serious expression", "video-llm-prediction": "The video features a man who is seen smiling and then showing a serious expression. He then smiles again. The video seems to be a simple one, with no other significant events or actions taking place.", "gt-answer": "C. Showing a serious expression, then smiling", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen smiling and then showing a serious expression, followed by smiling again. This implies that the man's expression changes from smiling to showing a serious expression, and then back to smiling.", "chatgpt-answer": "C. Showing a serious expression, then smiling", "video-llm-prediction": "The man in the video is seen smiling and then showing a serious expression. He then smiles again.", "gt-answer": "C. Showing a serious expression, then smiling", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man's expression changes from smiling to showing a serious expression.", "chatgpt-answer": "B. Smiling, then showing a serious expression", "video-llm-prediction": "The man in the video is seen smiling and then showing a serious expression.", "gt-answer": "C. Showing a serious expression, then smiling", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man starts by smiling, then shows a serious expression, and finally smiles again. Therefore, the correct answer is B. Smiling, then showing a serious expression.", "chatgpt-answer": "B. Smiling, then showing a serious expression", "video-llm-prediction": "The man in the video is seen smiling and then showing a serious expression. He then smiles again.", "gt-answer": "C. Showing a serious expression, then smiling", "rating": 0 } ] }, "1067427023": { "speed": [ { "chatgpt-reasoning": "Based on the video description, there is no specific mention of the speed of the video. However, since the description mentions the camera capturing the person's movements as they walk through the snow, it can be inferred that the video is most likely in normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a snowy field with a close-up shot of the snow. The camera then pans out to show the entire field covered in snow. The video then shows a person walking through the snowy field. The camera captures the person's movements as they walk through the snow. The video ends with a shot of the snowy field.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the video showcases a snowy field with a person walking through it. The camera pans around the field, capturing the beauty of the snow-covered landscape. There is no mention of any special effects or changes in speed. Therefore, we can assume that the video is shown at normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a snowy field with a close-up of the snow, followed by a person walking through the snowy field. The camera then pans around the snowy field, capturing the beauty of the snow-covered landscape. The video highlights the serene and peaceful atmosphere of the snowy field, with the sound of crunching snow underfoot adding to the immersive experience. The snowy field is a perfect setting for a winter wonderland, and the video captures the essence of the season.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the field and we can see the snow falling from the sky. This suggests that the video is in normal speed, capturing real-time movement.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video shows a snowy field with a lot of snow on the ground. The camera pans around the field, and we can see the snow falling from the sky.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. As a result, it is impossible to determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a snowy landscape with a focus on the snow-covered grass. The camera pans around the area, capturing the beauty of the snow-covered grass.", "gt-answer": "B. time-lapse", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the snow particles are melting, condensing, and solidifying. \"Melting\" refers to the process of changing from a solid state to a liquid state, \"condensing\" refers to the process of changing from a gas state to a liquid state, and \"solidifying\" refers to the process of changing from a liquid state to a solid state. Since the video captures all these transformations, the correct answer is:", "chatgpt-answer": "A. solidifying", "video-llm-prediction": "The video shows a close-up of snow particles melting and condensing. The snow particles are seen melting and condensing, and the video captures the process of melting and condensing. The video also shows the snow particles solidifying, indicating that they are freezing. The video provides a detailed view of the snow particles and their behavior in different conditions.", "gt-answer": "B. melting", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the snow particles are melting and solidifying.", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of snow melting and solidifying. The snow particles are seen melting and solidifying, and the video captures the transformation of the snow from a solid to a liquid state and vice versa. The video provides a visual representation of the process of snow melting and solidifying, highlighting the changes in the snow's state.", "gt-answer": "B. melting", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the snow particles are melting and solidifying. This means that the snow particles are changing from a solid state to a liquid state (melting) and then changing from a liquid state back to a solid state (solidifying). None of the choices can capture this complete transformation.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows snow particles melting and solidifying.", "gt-answer": "B. melting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the snow particles are melting and solidifying. The process of melting involves the transformation from a solid state to a liquid state, while solidifying is the reverse process, transforming from a liquid state to a solid state. Therefore, both A. solidifying and B. melting describe the transformation happening to the snow particles.", "chatgpt-answer": "A. solidifying and B. melting", "video-llm-prediction": "The video showcases the process of snow particles melting and solidifying. The video starts with a close-up shot of snow particles, which then transitions to a wider shot of the snow-covered ground. The camera then zooms in on the snow particles, highlighting their melting process. The video then shows the snow particles solidifying, with the camera capturing the process from different angles. The video ends with a shot of the snow-covered ground, emphasizing the beauty of the snowy landscape.", "gt-answer": "B. melting", "rating": 0 } ] }, "1093948229": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the golden particles are seen exploding and scattering. It also states that the particles are shown to be shrinking and disappearing. Therefore, both options C and D (scattering and exploding) can be inferred from the video description.", "chatgpt-answer": "C. scattering and D. exploding", "video-llm-prediction": "The video showcases a close-up of golden particles that are seen exploding and scattering. The particles are shown to be shrinking and disappearing, creating a mesmerizing visual effect. The video captures the beauty of the particles as they interact with each other, creating a stunning display of light and color. The sound of the particles exploding and scattering adds to the immersive experience, making it feel like you are right there with them. Overall, the video is a captivating display of the natural beauty of the world around us.", "gt-answer": "D. exploding", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the golden particles are seen exploding and scattering in different directions. Additionally, it states that the particles are seen shrinking and disappearing. Both of these descriptions indicate that the golden particles are both exploding and disappearing.", "chatgpt-answer": "D. exploding", "video-llm-prediction": "The video showcases a container filled with golden particles that are seen exploding and scattering in different directions. The particles are seen shrinking and disappearing, leaving behind a cloud of dust. The video captures the particles in various positions, including in the air and on the ground. The sound of the explosion and the movement of the particles can be heard, adding to the immersive experience. Overall, the video provides a mesmerizing display of the golden particles and their various movements.", "gt-answer": "D. exploding", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the golden particles are exploding.", "chatgpt-answer": "D. exploding", "video-llm-prediction": "A video of golden particles that are shown to be exploding.", "gt-answer": "D. exploding", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the golden particles are exploding and scattering in various directions.", "chatgpt-answer": "D. exploding", "video-llm-prediction": "A video showcases a container filled with golden particles that are seen exploding and scattering in various directions.", "gt-answer": "D. exploding", "rating": 1 } ] }, "1106668103": { "direction": [ { "chatgpt-reasoning": "The video description mentions that coffee beans are ground up, mixed together, and then poured into a cup. This implies a sequence of movements, indicating that there is movement in the video.", "chatgpt-answer": "B. moving forward", "video-llm-prediction": "The video showcases a close-up of coffee beans, which are then ground up and mixed together. The resulting coffee is then poured into a cup and enjoyed by the viewer.", "gt-answer": "B. moving forward", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention any specific direction of movement. It only describes the camera panning from a close-up of coffee beans to a larger group, and then to the entire group of coffee beans. This indicates that the movement is primarily from a close-up perspective to a wider view, but it doesn't specify if it's moving forward or backward.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a close-up of coffee beans, with a focus on their texture and appearance. The camera then pans out to reveal a larger group of coffee beans, emphasizing their abundance and variety. The video concludes with a shot of the entire group of coffee beans, highlighting their collective beauty and the vastness of the coffee bean world.", "gt-answer": "B. moving forward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera is panning back and forth, which indicates movement. None of the choices mention movement, so none of them are correct.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of coffee beans is shown, and the camera pans back and forth.", "gt-answer": "B. moving forward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the coffee beans are ground up and mixed together. This indicates movement and activity in the video, so the correct answer would be \"B. moving forward\".", "chatgpt-answer": "B. moving forward", "video-llm-prediction": "The video showcases a close-up of coffee beans, which are then ground up and mixed together. The resulting mixture is then poured into a cup and stirred with a spoon. The video ends with a shot of the coffee being poured into a mug.", "gt-answer": "B. moving forward", "rating": 1 } ] }, "1049965795": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the light bulb is turned off and then shown breaking. This indicates that the light bulb is breaking.", "chatgpt-answer": "B. breaking", "video-llm-prediction": "The video shows a close-up of a light bulb, which is then turned off. The light bulb is then shown breaking, and the video ends.", "gt-answer": "C. light up", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the light bulb is initially turned off, and then it is shown rapidly changing colors. This indicates that the light bulb is not breaking or lighting up, but actually going through a process of rapidly changing colors.", "chatgpt-answer": "D. rapidly changing color", "video-llm-prediction": "The video showcases a close-up of a light bulb, which is then turned off. The camera then pans out to reveal the entire bulb. The video then shows the bulb rapidly changing colors, which is a fascinating sight to behold. The video is a great example of how light bulbs can be used to create stunning visual effects.", "gt-answer": "C. light up", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the light bulb is turned off.", "chatgpt-answer": "A. turning off", "video-llm-prediction": "A light bulb is shown in a dark room, and it is turned off.", "gt-answer": "C. light up", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the light bulb is turned off.", "chatgpt-answer": "A. turning off", "video-llm-prediction": "A light bulb is shown in a dark room, and it is turned off.", "gt-answer": "C. light up", "rating": 0 } ] }, "1052364490": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the digital bar chart starts small and gradually grows in size. It also mentions that the chart stays in the same size. Therefore, the correct answer is that the digital bar chart is staying in the same size.", "chatgpt-answer": "A. staying in the same size", "video-llm-prediction": "The video features a digital bar chart that starts small and gradually grows in size. The video also includes a piece of information that states the chart stays in the same size.", "gt-answer": "B. growing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the digital bar chart starts small and gradually grows in size, emphasizing the importance of staying in the same size and not shrinking.", "chatgpt-answer": "B. growing", "video-llm-prediction": "The video showcases a digital bar chart that starts small and gradually grows in size. The video emphasizes the importance of staying in the same size and not shrinking.", "gt-answer": "B. growing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the digital bar chart is growing in size.", "chatgpt-answer": "B. growing", "video-llm-prediction": "A digital bar chart is shown, and it is growing in size.", "gt-answer": "B. growing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the digital bar chart remains in the same size throughout the video, indicating that there is no change in its size.", "chatgpt-answer": "A. staying in the same size", "video-llm-prediction": "A digital bar chart is shown, and it remains in the same size throughout the video.", "gt-answer": "B. growing", "rating": 0 } ] }, "1080990179": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the apple is shown growing bigger. It goes from a close-up shot of an apple to showing the apple growing bigger, which indicates growth.", "chatgpt-answer": "C. growing bigger", "video-llm-prediction": "The video shows the process of an apple ripening and drying out. The video starts with a close-up shot of an apple, and then it shows the apple growing bigger. The video then shows the apple shrinking and drying out. The video ends with a close-up shot of the apple. The information that is consistent with the video is that the apple is shown growing bigger.", "gt-answer": "B. shrinking and drying out", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the apple starts by ripening, then transitions to shrinking and drying out, and ends with growing bigger.", "chatgpt-answer": "C. growing bigger", "video-llm-prediction": "The video showcases the process of an apple ripening and drying out. It starts with a close-up shot of an apple, which then transitions to a shot of the apple being cut open to reveal the inside. The video then shows the apple being left out, which causes it to shrink and dry out. The video ends with a shot of the apple growing bigger.", "gt-answer": "B. shrinking and drying out", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the apple is initially cut in half, revealing the seeds and the process of ripening. It also shows the apple growing bigger and then shrinking and drying out. Therefore, the correct answer would be \"B. shrinking and drying out\" as it accurately describes what is happening to the apple throughout the video.", "chatgpt-answer": "B. shrinking and drying out", "video-llm-prediction": "The video shows the process of an apple ripening and drying out. The apple is initially cut in half and then shown from the inside, revealing the seeds and the process of the apple ripening. The video also shows the apple growing bigger and shrinking and drying out.", "gt-answer": "B. shrinking and drying out", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, the apple goes through two main processes. First, it ripens and then it shrinks and dries out. It starts with a close-up of an apple followed by cutting it in half, showing the seeds and the process of the apple ripening. Then, the video shows the apple drying out and shrinking. None of the choices can fully explain the two processes mentioned in the video description, but the closest option is B. shrinking and drying out.", "chatgpt-answer": "B. shrinking and drying out", "video-llm-prediction": "The video showcases the process of an apple ripening and drying out. It starts with a close-up of an apple, which then transitions to a shot of the apple being cut in half. The inside of the apple is then shown, revealing the seeds and the process of the apple ripening. The video then shows the apple drying out and shrinking, highlighting the natural process of an apple's life cycle.", "gt-answer": "B. shrinking and drying out", "rating": 1 } ] }, "1057163434": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the chef starts by putting mayonnaise on the bread and then adds meat to the bread. This indicates that the bread is being used as a base or a bun for the burger, not being eaten, thrown away or placed on top of the burger.", "chatgpt-answer": "C. putting it inside the burger", "video-llm-prediction": "The video showcases a chef making a delicious burger. The chef starts by putting mayonnaise on the bread and then adds meat to the bread. He then adds lettuce and tomatoes to the burger. Finally, he adds cheese to the burger and serves it on a plate.", "gt-answer": "B. putting it on top of the burger", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the chef is preparing a burger. In the video, the chef puts the bun on a plate and then adds ingredients like cheese, tomatoes, and lettuce on top of it. This indicates that the chef is putting the bread on top of the burger.", "chatgpt-answer": "B. putting it on top of the burger", "video-llm-prediction": "The video showcases a chef preparing a delicious burger. The chef starts by putting a burger patty on a bun and then adds cheese, tomatoes, and lettuce. The chef then adds some sauce on top of the burger and serves it on a plate. The video is a great example of how to make a tasty burger.", "gt-answer": "B. putting it on top of the burger", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the chef is putting meat, cheese, and vegetables on top of a bun. This indicates that the chef is using the bread as part of the burger bun.", "chatgpt-answer": "C. putting it inside the burger", "video-llm-prediction": "A chef is shown making a burger by putting meat, cheese, and vegetables on top of a bun.", "gt-answer": "B. putting it on top of the burger", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef is putting the bread on top of the burger, indicating that the chef is using it as a bun for the burger.", "chatgpt-answer": "B. putting it on top of the burger", "video-llm-prediction": "A chef is seen preparing a burger by putting it on top of a bun and adding various ingredients.", "gt-answer": "B. putting it on top of the burger", "rating": 1 } ] }, "1085910917": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that the woman is seen drinking water from a glass.", "chatgpt-answer": "A. drinking", "video-llm-prediction": "A woman is seen drinking water from a glass.", "gt-answer": "A. drinking", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is \"drinking water from a glass\".", "chatgpt-answer": "A. drinking", "video-llm-prediction": "A woman is seen drinking water from a glass while standing in a kitchen.", "gt-answer": "A. drinking", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the woman is drinking water from a glass.", "chatgpt-answer": "A. drinking", "video-llm-prediction": "A woman drinks water from a glass.", "gt-answer": "A. drinking", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is drinking water from a glass.", "chatgpt-answer": "A. drinking", "video-llm-prediction": "A woman is seen drinking water from a glass.", "gt-answer": "A. drinking", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description states that the woman is seen drinking water from a glass and turning back. This implies that she performs the action of drinking water first, and then turns back.", "chatgpt-answer": "A. drinking a glass of water and then turning back", "video-llm-prediction": "A woman is seen drinking water from a glass and turning back.", "gt-answer": "A. drinking a glass of water and then turning back", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is drinking water from a glass and turning back. Therefore, the events occur in the sequence of drinking a glass of water first, and then turning back.", "chatgpt-answer": "A. drinking a glass of water and then turning back", "video-llm-prediction": "A woman is seen drinking water from a glass and turning back.", "gt-answer": "A. drinking a glass of water and then turning back", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman drinks water from a glass and then turns back. This indicates that the event of drinking water occurs before the event of turning back.", "chatgpt-answer": "A. drinking a glass of water and then turning back", "video-llm-prediction": "A woman drinks water from a glass and turns back.", "gt-answer": "A. drinking a glass of water and then turning back", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is first seen drinking water from a glass and then turning back.", "chatgpt-answer": "A. drinking a glass of water and then turning back", "video-llm-prediction": "A woman is seen drinking water from a glass and turning back.", "gt-answer": "A. drinking a glass of water and then turning back", "rating": 1 } ] }, "1058907236": { "action": [ { "chatgpt-reasoning": "The video description clearly mentions that the squirrel is foraging for food in a forest. It is seen picking up nuts and eating them while standing on a tree stump and a tree branch.", "chatgpt-answer": "C. Foraging", "video-llm-prediction": "The video shows a squirrel foraging for food in a forest. The squirrel is seen picking up a nut and eating it while standing on a tree stump. The squirrel is also seen eating a nut while standing on a tree branch. The video provides a glimpse into the natural behavior of a squirrel in its natural habitat.", "gt-answer": "C. Foraging", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the squirrel is foraging for food, eating nuts, walking around, and sleeping in a tree.", "chatgpt-answer": "C. Foraging", "video-llm-prediction": "A squirrel is seen foraging for food in a forest. It is seen eating nuts and walking around the forest. The squirrel is also seen sleeping in a tree.", "gt-answer": "C. Foraging", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the squirrel is foraging for food in the woods, indicating that it is searching for and collecting food.", "chatgpt-answer": "C. Foraging", "video-llm-prediction": "A squirrel is seen foraging for food in the woods.", "gt-answer": "C. Foraging", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the squirrel is \"foraging for food in a forest.\"", "chatgpt-answer": "C. Foraging", "video-llm-prediction": "A squirrel is seen foraging for food in a forest.", "gt-answer": "C. Foraging", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "Based on the video description, the squirrel is seen picking up a nut and then turning back. The description specifically mentions \"The squirrel is seen in its natural habitat\", implying that the actions described are observed in the video.", "chatgpt-answer": "C. Picking up a nut followed by turning back", "video-llm-prediction": "In the video, a squirrel is seen picking up a nut and turning back. The squirrel then continues to eat the nut. The video showcases the squirrel's natural behavior of foraging for food. The squirrel's actions are typical of a squirrel's behavior, and the video provides a glimpse into the squirrel's daily routine. The video is shot in a natural setting, and the squirrel is seen in its natural habitat. The video is a great example of the beauty of nature and the importance of preserving it.", "gt-answer": "C. Picking up a nut followed by turning back", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the squirrel is picking up a nut and then turning back. Therefore, the correct order of events is \"Picking up a nut followed by turning back\".", "chatgpt-answer": "C. Picking up a nut followed by turning back", "video-llm-prediction": "A squirrel is seen in a forest, picking up a nut and turning back. The squirrel then continues to eat the nut.", "gt-answer": "C. Picking up a nut followed by turning back", "rating": 1 }, { "chatgpt-reasoning": "From the video description, it is mentioned that the squirrel picks up a nut and then turns back. This implies that the correct order of events is picking up a nut followed by turning back.", "chatgpt-answer": "C. Picking up a nut followed by turning back", "video-llm-prediction": "A squirrel picks up a nut and turns back.", "gt-answer": "C. Picking up a nut followed by turning back", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the squirrel first picks up a nut and then turns back. Therefore, the correct order of the events is picking up a nut followed by turning back.", "chatgpt-answer": "C. Picking up a nut followed by turning back", "video-llm-prediction": "The video shows a squirrel picking up a nut and turning back.", "gt-answer": "C. Picking up a nut followed by turning back", "rating": 1 } ] }, "1077575504": { "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly states that the pile of salt is gradually shrinking.", "chatgpt-answer": "A. shrinking", "video-llm-prediction": "The video shows a pile of salt that is gradually shrinking.", "gt-answer": "B. growing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the pile of salt is being poured into a container and then melting and disappearing. This indicates that the salt is melting and ultimately disappearing.", "chatgpt-answer": "C. melting", "video-llm-prediction": "The video showcases a pile of salt that is being poured into a container. The salt is then seen melting and disappearing.", "gt-answer": "B. growing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the pile of salt is shrinking.", "chatgpt-answer": "A. shrinking", "video-llm-prediction": "A pile of salt is shown, and it is shrinking.", "gt-answer": "B. growing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the pile of salt is shrinking. None of the other choices (growing, melting, disappearing) accurately describe what is happening to the salt.", "chatgpt-answer": "A. shrinking", "video-llm-prediction": "A pile of salt is shown, and it is seen shrinking.", "gt-answer": "B. growing", "rating": 0 } ] }, "23370985": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the person is melting the ice with a lighter, and the ice gradually melts away. This indicates that the ice crystal is undergoing the process of melting.", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of melting ice, which is a fascinating natural phenomenon. The video starts with a close-up shot of ice, which then transitions to a person melting the ice with a lighter. The camera captures the process of melting, and the ice gradually melts away. The video also includes a shot of the person holding the ice in their hand, which is a common practice in scientific experiments. Overall, the video provides a detailed and informative look at the process of melting ice.", "gt-answer": "A. freezing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the focus is on the melting process of the ice. It describes how the ice transforms from solid to liquid, highlighting the beauty of the melting process. Therefore, the correct answer is B. melting.", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of ice melting, with a focus on the melting process. The video begins with a close-up shot of ice, which then transitions to a shot of water dripping onto the ice. The camera then pans out to show the entire ice melting process. The video highlights the beauty of the melting process and the transformation of the ice from solid to liquid. The sound of dripping water and the visuals of the ice melting create a calming and soothing effect. Overall, the video provides a mesmerizing experience of watching the ice melting process.", "gt-answer": "A. freezing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the ice crystals are seen melting.", "chatgpt-answer": "B. melting", "video-llm-prediction": "A close-up of ice crystals is shown, and they are seen melting.", "gt-answer": "A. freezing", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the ice is melting and turning into water.", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of ice melting, with a focus on the melting process. The video starts with a close-up shot of ice, which then transitions to a shot of the ice melting. The melting process is then shown in detail, with the ice gradually melting and turning into water. The video ends with a shot of the water that is left after the ice has melted.", "gt-answer": "A. freezing", "rating": 0 } ] }, "1100319395": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the white circle with a black dot is moving in a clockwise direction, and then it shows that the same object is moving in a counter-clockwise direction. This indicates a change in direction from clockwise to counter-clockwise.", "chatgpt-answer": "C. counter-clockwise", "video-llm-prediction": "A white circle with a black dot in the center is shown, followed by a white circle with a black dot moving in a clockwise direction. The video then shows a white circle with a black dot moving in a counter-clockwise direction.", "gt-answer": "A. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the circular pattern is moving in a clockwise direction.", "chatgpt-answer": "A. clockwise", "video-llm-prediction": "The video showcases a circular pattern that moves in a clockwise direction. The pattern is then shown moving in the opposite direction.", "gt-answer": "A. clockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the circular pattern is moving in a clockwise direction.", "chatgpt-answer": "A. clockwise", "video-llm-prediction": "A circular pattern is shown in the video, and it moves in a clockwise direction.", "gt-answer": "A. clockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the circular pattern moves in both clockwise and counter-clockwise directions.", "chatgpt-answer": "B. not moving", "video-llm-prediction": "The video showcases a circular pattern that moves in a clockwise direction, followed by a circular pattern that moves in a counter-clockwise direction.", "gt-answer": "A. clockwise", "rating": 0 } ] }, "1067268406": { "speed": [ { "chatgpt-reasoning": "The video description states that the car is seen driving on the highway at the same speed as the camera, at a faster speed than the camera, and at a slower speed than the camera. This suggests that the car is driving at different speeds.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a car driving on a highway at the same speed as the camera. The car is seen driving on the highway at a faster speed than the camera. The car is also seen driving on the highway at a slower speed than the camera. The video captures the car driving on the highway at different speeds.", "gt-answer": "B. faster than the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the car is driving down the highway at the same speed as the camera.", "chatgpt-answer": "A. at the same speed as the camera", "video-llm-prediction": "The video showcases a car driving down a highway at the same speed as the camera. The car is seen passing by wind turbines and a bridge. The car is also seen driving on a bridge and a highway. The video captures the serene beauty of the surroundings and the peacefulness of the drive.", "gt-answer": "B. faster than the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the car drives down a highway at the same speed as the camera, indicating that the speed of the car is equal to the speed of the camera.", "chatgpt-answer": "A. at the same speed as the camera", "video-llm-prediction": "A car drives down a highway at the same speed as the camera.", "gt-answer": "B. faster than the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the car is seen driving at the same speed as the camera.", "chatgpt-answer": "A. at the same speed as the camera", "video-llm-prediction": "The video showcases a car driving on a highway during a beautiful sunset. The car is seen driving at the same speed as the camera, and the sunset creates a serene and peaceful atmosphere. The video captures the car's journey on the highway, with the sunset serving as a stunning backdrop.", "gt-answer": "B. faster than the camera", "rating": 0 } ] }, "1092682551": { "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the cars are traveling at the same speed as the camera.", "chatgpt-answer": "A. travel at the same speed as the camera", "video-llm-prediction": "The video shows a busy city street with cars traveling at the same speed as the camera. The cars are seen driving on the street and passing under a bridge. The video captures the hustle and bustle of the city, with the sound of engines revving and the honking of horns adding to the chaos. The camera pans around the street, showing the cars moving in all directions, with some cars driving faster than the camera and others driving slower. The video provides a glimpse into the daily life of city dwellers, with the cars serving as a symbol of the constant movement and activity that", "gt-answer": "C. travel slower than the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the cars are traveling at different speeds. Therefore, it is clear that the speed of the cars is not the same as the camera.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a busy city street with cars traveling at different speeds. The camera captures the movement of the cars as they navigate through the bustling cityscape. The video provides a glimpse into the daily life of city dwellers and the constant movement of vehicles on the streets.", "gt-answer": "C. travel slower than the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the cars are seen traveling at the same speed as the camera, as well as faster and slower than the camera. This indicates that the cars have varying speeds in relation to the camera.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a busy city street with cars traveling at the same speed as the camera. The cars are seen driving on the street, and the camera captures the movement of the cars. The video also shows the cars traveling faster than the camera and slower than the camera. The video captures the hustle and bustle of the city street, with the cars moving in different directions. The video provides a glimpse into the daily life of the city and the constant movement of the cars.", "gt-answer": "C. travel slower than the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the cars are \"traveling at the same speed as the camera.\"", "chatgpt-answer": "A. travel at the same speed as the camera", "video-llm-prediction": "The video showcases a busy city street with cars traveling at the same speed as the camera. The camera captures the bustling cityscape, with cars moving in various directions, and the sound of honking and revving engines adding to the chaos. The camera then pans up to show the tall buildings surrounding the street, with their windows reflecting the city's lights. The camera then moves to the top of the street, where it captures the cars moving in the opposite direction, with the sound of engines and horns filling the air. The camera then pans down to the street, where the", "gt-answer": "C. travel slower than the camera", "rating": 0 } ] }, "1101200293": { "direction": [ { "chatgpt-reasoning": "The video description states that the camera pans around the carrier and showcases the rotation of the aircraft carrier. This indicates that the camera is moving in a circular motion around the carrier. Based on the description, I can infer that the camera motion is counterclockwise.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video showcases a large aircraft carrier with numerous fighter jets parked on its deck. The camera pans around the carrier, showcasing the impressive size and the various positions of the jets. The video then transitions to a computer-generated animation of the aircraft carrier, which is shown rotating in different directions. The animation is used to emphasize the size and movement of the aircraft carrier and the fighter jets. The video ends with a shot of the aircraft carrier and the fighter jets parked on its deck. Overall, the video provides a detailed view of", "gt-answer": "D. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the aircraft carrier is seen moving across the ocean. Based on this information, we can infer that the camera motion is most likely showing the movement of the carrier from a fixed position. If the camera was moving in any specific direction relative to the carrier, it would have been mentioned in the video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a large aircraft carrier with numerous fighter jets parked on its deck. The carrier is seen moving across the ocean, with the fighter jets following in a line. The video captures the impressive size and power of the aircraft carrier and the precision of the fighter jets as they move in unison.", "gt-answer": "D. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera starts with a view of the entire group of airplanes parked on the boat and then zooms in on the airplanes. This indicates that the camera is moving closer to the subject, which is upward motion.", "chatgpt-answer": "C. upward", "video-llm-prediction": "A video of a large group of airplanes parked on a boat. The video starts with a view of the entire group of airplanes parked on the boat. The camera then zooms in on the airplanes, showing them parked in a neat row. The video then shows the airplanes from a distance, still parked in a row. The video ends with a view of the entire group of airplanes parked on the boat.", "gt-answer": "D. clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera starts with a wide shot of the entire scene, then zooms in on the airplanes, and finally pans out to show the entire scene again. This implies that the camera is moving in a circular motion around the aircraft carrier.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "A large group of airplanes are parked on a boat, and they are all facing the same direction. The video starts with a wide shot of the entire scene, and then zooms in on the airplanes. The camera then pans out to show the entire scene again. The video ends with a shot of the entire scene.", "gt-answer": "D. clockwise", "rating": 0 } ] }, "1072453637": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera is capturing the movement of the fighter jet from various angles, including shots from the back and from the front. It also mentions that the camera is panning downwards and panning upwards.", "chatgpt-answer": "B. panning downwards around a fighter jet", "video-llm-prediction": "The video showcases a fighter jet flying through the sky, with the camera capturing its movement from various angles. The jet is seen from the back, panning downwards, and then from the front, panning upwards. The video also includes a shot of the jet flying through the sky, with the camera capturing its movement from various angles. Overall, the video provides a dynamic and engaging view of the fighter jet in action.", "gt-answer": "A. panning to the back of a fighter jet", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera is capturing the fighter jet's movements from various angles, including a shot of the back of the jet and a close-up of the front of the jet. It does not mention any panning downwards or upwards around the jet.", "chatgpt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "The video showcases a fighter jet flying through the sky, with the camera capturing its movements from various angles. The jet is seen flying in different directions, including upwards, downwards, and around in a circle. The video also includes a shot of the back of the jet and a close-up of the front of the jet. The fighter jet is shown flying through the sky, with the camera capturing its movements from various angles. The video provides a detailed view of the jet's flight, from its speed and maneuverability to its aerodynamic design. Overall, the video is a capt", "gt-answer": "A. panning to the back of a fighter jet", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera is panning around the fighter jet, showing different angles including the back, front, and sides. This indicates that the camera is moving horizontally to capture the different views of the jet.", "chatgpt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "A fighter jet is seen flying in the sky, with the camera panning around it. The jet is shown from different angles, including the back, front, and sides. The video captures the jet's movement and flight in the sky.", "gt-answer": "A. panning to the back of a fighter jet", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the camera is panning around the fighter jet. Since the video captures the beauty and power of the jet as it soars through the sky, it is likely that the camera is panning to showcase different angles of the jet, including the front and back.", "chatgpt-answer": "D. panning to the front of a fighter jet", "video-llm-prediction": "A fighter jet is seen flying in the sky, with the camera panning around it. The jet is shown from different angles, including the front and back. The video captures the beauty and power of the fighter jet as it soars through the sky.", "gt-answer": "A. panning to the back of a fighter jet", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that the fighter jet initially shoots three missiles, and then shoots four more missiles.", "chatgpt-answer": "A. shooting three missiles, then shooting four missiles", "video-llm-prediction": "The video shows a fighter jet flying in the sky and shooting three missiles. The jet then shoots four more missiles.", "gt-answer": "C. shooting one missile, then shooting two missiles", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states the order of events for the fighter jet. It first shoots three missiles, then shoots four more missiles, and finally shoots three additional missiles.", "chatgpt-answer": "A. shooting three missiles, then shooting four missiles", "video-llm-prediction": "The video showcases a fighter jet flying in the sky and shooting three missiles, followed by shooting four more missiles. The jet then shoots three more missiles, and the video ends with the jet flying away.", "gt-answer": "C. shooting one missile, then shooting two missiles", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the fighter jet shoots three missiles first, and then shoots four missiles.", "chatgpt-answer": "A. shooting three missiles, then shooting four missiles", "video-llm-prediction": "The fighter jet shoots three missiles, then shoots four missiles.", "gt-answer": "C. shooting one missile, then shooting two missiles", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the fighter jet shoots three missiles first, and then shoots four more missiles. None of the other answer choices match this order of events.", "chatgpt-answer": "A. shooting three missiles, then shooting four missiles", "video-llm-prediction": "The video captures a fighter jet flying in the sky and shooting three missiles. The jet then shoots four more missiles, and the video ends.", "gt-answer": "C. shooting one missile, then shooting two missiles", "rating": 0 } ] }, "3396473605": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the five stars appear from right to left.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "The video shows a man walking on a sidewalk and then entering a building. The video then shows a blue screen with five stars appearing from right to left.", "gt-answer": "C. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about stars appearing in any direction. Therefore, it is not possible to determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a man who is seen speaking to the camera while holding a baseball bat. He then proceeds to hit a baseball, which is shown in slow motion. The video ends with the man speaking to the camera again.", "gt-answer": "C. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the five stars appear from right to left.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "Five stars appear from right to left.", "gt-answer": "C. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the direction in which the stars appear. None of the choices can be determined based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video features a man who is seen speaking to the camera while holding a bottle of mouthwash. He then proceeds to gargle the mouthwash and spits it out into the sink. The video ends with the man waving goodbye to the camera.", "gt-answer": "C. from left to right", "rating": 0 } ] }, "1086820415": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the wave is moving vertically towards the top of the screen and then continues to move horizontally towards the right side of the screen.", "chatgpt-answer": "B. moving horizontally towards the right side of the screen", "video-llm-prediction": "The video showcases a large wave moving vertically towards the top of the screen. The wave is seen crashing down in the water, creating a beautiful display of white foam. The wave continues to move horizontally towards the right side of the screen, creating a sense of motion and excitement. The video captures the power and beauty of the ocean, and the wave's movement is a testament to the force of nature.", "gt-answer": "C. moving vertically towards the bottom of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the large wave is moving towards the top of the screen.", "chatgpt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "The video showcases a large wave moving towards the top of the screen, followed by a series of waves moving horizontally towards the right side of the screen. The waves continue to move towards the bottom of the screen, creating a mesmerizing view. The waves are so large that they almost cover the entire screen, making it a breathtaking sight to watch. The video captures the beauty and power of nature, as the waves crash against each other, creating a symphony of sound and visuals. Overall, the video is a stunning display of the natural world and its power.", "gt-answer": "C. moving vertically towards the bottom of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the large wave is moving vertically towards the top of the screen.", "chatgpt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "The video shows a large wave moving vertically towards the top of the screen.", "gt-answer": "C. moving vertically towards the bottom of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the large wave is moving vertically towards the top of the screen.", "chatgpt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "A large wave is seen moving vertically towards the top of the screen.", "gt-answer": "C. moving vertically towards the bottom of the screen", "rating": 0 } ] }, "1081513610": { "action": [ { "chatgpt-reasoning": "The video description clearly states that two men are sitting at a table, one using a laptop while the other is holding a pen and paper. The men are seen writing and pointing to something, indicating that they are engaged in some kind of activity or discussion.", "chatgpt-answer": "B. discussing", "video-llm-prediction": "Two men are sitting at a table, one of them is using a laptop while the other is holding a pen and paper. The man using the laptop is seen writing on the paper while the other man is pointing to something. The man with the pen and paper then starts writing on the paper while the other man continues to use the laptop.", "gt-answer": "B. discussing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that two men are sitting at a table, one of them is wearing glasses and the other is not. They are both holding pens and the man with glasses is also holding a laptop. The man with glasses is pointing to the laptop and the other man is nodding his head. Based on these clues, it can be inferred that the two men are having some form of communication or discussion.", "chatgpt-answer": "B. discussing", "video-llm-prediction": "Two men are sitting at a table, one of them is wearing glasses and the other is not. The man with glasses is holding a pen and a laptop, while the other man is holding a pen and a notebook. The man with glasses is pointing to the laptop and the other man is nodding his head.", "gt-answer": "B. discussing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that one man is using a laptop and pointing to something on the screen, while the other man is holding a pen and paper and writing. This indicates that they are engaged in some sort of discussion or collaboration.", "chatgpt-answer": "B. discussing", "video-llm-prediction": "Two men are sitting at a table, one of them is using a laptop while the other is holding a pen and paper. The man using the laptop is pointing to something on the screen while the other man is writing on the paper.", "gt-answer": "B. discussing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that one man is using a laptop while the other is writing on a piece of paper. Additionally, the man using the laptop is pointing to something on the screen. This suggests that the two men are engaged in some form of communication or discussion.", "chatgpt-answer": "B. discussing", "video-llm-prediction": "Two men are sitting at a table, one of them is using a laptop while the other is writing on a piece of paper. The man using the laptop is pointing to something on the screen while the other man is writing.", "gt-answer": "B. discussing", "rating": 1 } ] }, "1073831006": { "action": [ { "chatgpt-reasoning": "The video description explicitly mentions that the zebras are running through a field and some of them are jumping into the water.", "chatgpt-answer": "C. running", "video-llm-prediction": "The video shows a group of zebras running through a field, with some of them jumping into the water. The information that is consistent with the video is that the zebras are running.", "gt-answer": "C. running", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the zebras are running through a field, jumping into the water. There is no mention of swimming or sleeping.", "chatgpt-answer": "C. running", "video-llm-prediction": "The video shows a group of zebras running through a field, with some of them jumping into the water. The zebras are seen running in a line, and some of them are seen running in a circle. The video captures the zebras in their natural habitat, with the grass and trees in the background. The zebras are seen running in a line, with some of them jumping into the water. The video provides a glimpse into the natural behavior of zebras and their ability to adapt to their environment.", "gt-answer": "C. running", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the zebras are running through a field and some of them are jumping into the water. There is no information indicating that they are swimming or sleeping.", "chatgpt-answer": "C. running", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them jumping into the water.", "gt-answer": "C. running", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the zebras are running through a field and some of them are jumping into the water. Therefore, the correct answer is C. running.", "chatgpt-answer": "C. running", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them jumping into the water.", "gt-answer": "C. running", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that some zebras are running from right to left and others are running from left to right.", "chatgpt-answer": "A. from right to left, B. from left to right", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them running towards the water. The zebras are seen running in different directions, with some running from right to left and others from left to right.", "gt-answer": "B. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that some zebras are running from right to left and others are running from left to right. This indicates that the direction of the zebras' movement is not strictly from one side to the other but rather in both directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them running from right to left and others from left to right. The zebras are seen running in a herd, with some of them running towards the camera and others running away from it. The field is surrounded by tall grass, and the zebras are running with their tails up. The video captures the zebras in their natural habitat, with the sound of their hooves pounding against the ground. The zebras are seen running in a line, with some of them running faster than others. The video provides a", "gt-answer": "B. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the zebras are running from right to left.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "A group of zebras are seen running through a field. They are running from right to left, and then they stop and turn around.", "gt-answer": "B. from left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that some zebras are running from right to left, while others are running from left to right.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "A group of zebras is seen running through a field, with some of them running towards the water. The zebras are seen running in different directions, with some running from right to left, while others run from left to right. The video captures the zebras in motion, with their distinct black and white stripes visible as they run. The field is vast and open, with no other animals or objects visible in the frame. The video provides a glimpse into the natural behavior of zebras in their natural habitat.", "gt-answer": "B. from left to right", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the zebras are running in a line, with some of them running faster than others. Additionally, it mentions the sound of hooves pounding against the ground, indicating movement and speed.", "chatgpt-answer": "C. fast motion", "video-llm-prediction": "The video shows a group of zebras running through a field. The zebras are seen running in a line, with some of them running faster than others. The video captures the zebras in motion, with their distinct black and white stripes visible. The sound of hooves pounding against the ground can be heard, adding to the immersive experience. The video ends with the zebras stopping and standing still in the field. Overall, the video provides a glimpse into the natural behavior of zebras in their natural habitat.", "gt-answer": "A. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that some zebras are running faster than others, indicating that they are not in slow motion or stationary. Additionally, the video captures their natural behavior and movement, so it can be assumed that the speed is normal for zebras.", "chatgpt-answer": "D. normal speed", "video-llm-prediction": "The video shows a group of zebras running through a field, with some of them running faster than others. The zebras are seen running in different directions, and some of them are running alone while others are running in pairs. The video captures the zebras' natural behavior and movement in their natural habitat.", "gt-answer": "A. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video captures the zebras in different speeds, including slow motion, stationary, and fast motion. It also states that the zebras are seen running through a field. Therefore, the correct answer is that the zebras are shown in all of the mentioned speeds - slow motion, stationary, fast motion, and normal speed.", "chatgpt-answer": "D. normal speed", "video-llm-prediction": "A group of zebras are seen running through a field in slow motion. They are chasing each other and kicking up dust as they run. The video captures the zebras in different speeds, including slow motion, stationary, and fast motion. The video also shows the zebras in a normal speed.", "gt-answer": "A. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the zebras are running at a slow pace.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "A group of zebras are seen running through a field of tall grass. The video is in slow motion, and the zebras are running at a slow pace. The zebras are seen running in a herd, and the camera captures their movements as they run through the field. The video provides a beautiful view of the zebras in their natural habitat, and the slow motion effect adds to the overall beauty of the video.", "gt-answer": "A. slow motion", "rating": 1 } ] }, "1069338034": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the mother elephant is eating grass and drinking water, while the baby elephant is playing in the water and drinking water from the river.", "chatgpt-answer": "A. eating and drinking", "video-llm-prediction": "The video shows a mother elephant and her baby elephant in a river. The mother elephant is seen eating grass and drinking water while the baby elephant is playing in the water. The video also shows the baby elephant drinking water from the river.", "gt-answer": "A. eating and drinking", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, the mother elephant is seen eating grass while the baby elephant plays in the water and drinks water from the river.", "chatgpt-answer": "A. eating and drinking", "video-llm-prediction": "The video showcases a mother elephant and her baby elephant as they enjoy a peaceful day by the river. The mother elephant is seen eating grass while her baby elephant plays in the water. The baby elephant is also seen drinking water from the river. The video captures the beauty of nature and the bond between a mother and her baby.", "gt-answer": "A. eating and drinking", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that both the mother elephant and her baby elephant are drinking water from the river. Additionally, it states that the baby elephant is playing with a stick in the water. Therefore, the elephants in the video are both drinking and playing.", "chatgpt-answer": "C. eating and playing", "video-llm-prediction": "The video shows a mother elephant and her baby elephant playing in the water. The baby elephant is seen drinking water from the river while the mother elephant is also drinking water. The video also shows the baby elephant playing with a stick in the water.", "gt-answer": "A. eating and drinking", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the elephants are eating and drinking, resting, playing in the water, and some of them are even seen sleeping.", "chatgpt-answer": "A. eating and drinking", "video-llm-prediction": "A herd of elephants can be seen enjoying their time in the water. Some of them are eating and drinking while others are resting. The elephants are seen playing in the water, and some of them are even seen sleeping. The video captures the peaceful and playful nature of these majestic creatures.", "gt-answer": "A. eating and drinking", "rating": 1 } ] }, "1076880707": { "action": [ { "chatgpt-reasoning": "The video description mentions that the bear is climbing a tree and eating honey. It also states that the bear is seen scratching against a tree. Both options A (eating honey) and C (scratching against a tree) are mentioned in the video description as activities of the bear near the tree.", "chatgpt-answer": "A. eating honey and C. scratching against a tree", "video-llm-prediction": "A brown bear is seen in a forest, climbing a tree and eating honey. The bear is also seen scratching against a tree.", "gt-answer": "C. scratching against a tree", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the bear is seen climbing a tree, scratching against it, and eating honey from a tree.", "chatgpt-answer": "A. eating honey", "video-llm-prediction": "A bear is seen in a forest, climbing a tree and scratching against it. The bear is also seen eating honey from a tree.", "gt-answer": "C. scratching against a tree", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the bear is eating honey from a tree and later climbs the tree and scratches against it.", "chatgpt-answer": "A. eating honey, B. climbing a tree, C. scratching against a tree", "video-llm-prediction": "A bear is seen eating honey from a tree. The bear then climbs the tree and scratches against it.", "gt-answer": "C. scratching against a tree", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the bear is seen climbing a tree and scratching against it. Additionally, it mentions that the bear is also seen eating honey from a tree. Both climbing a tree and eating honey are actions that the bear is doing near the tree.", "chatgpt-answer": "A. eating honey, B. climbing a tree", "video-llm-prediction": "A brown bear is seen in a forest, climbing a tree and scratching against it. The bear is also seen eating honey from a tree.", "gt-answer": "C. scratching against a tree", "rating": 0 } ] }, "1092278063": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the two rows of duck toys are moving in opposite directions on a conveyor belt. The description mentions that the toys are placed on a conveyor belt and shows a close-up of the toys moving in opposite directions.", "chatgpt-answer": "A. moving in opposite directions on a conveyor belt", "video-llm-prediction": "The video shows a conveyor belt with two rows of duck toys moving in opposite directions. The toys are yellow in color and are placed in a black box. The video also shows a close-up of the toys moving on the conveyor belt. The video ends with the toys moving in the same direction on the conveyor belt.", "gt-answer": "A. moving in opposite directions on a conveyor belt", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the two rows of duck toys are moving in opposite directions on a conveyor belt.", "chatgpt-answer": "A. moving in opposite directions on a conveyor belt", "video-llm-prediction": "The video shows a conveyor belt with two rows of duck toys moving in opposite directions. The toys are yellow in color and are placed on a black checkered floor. The video also shows a close-up of the toys. The toys are made of rubber and are placed on a conveyor belt. The video ends with the toys still in motion.", "gt-answer": "A. moving in opposite directions on a conveyor belt", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the two rows of duck toys are moving in opposite directions on a conveyor belt.", "chatgpt-answer": "A. moving in opposite directions on a conveyor belt", "video-llm-prediction": "A video shows two rows of duck toys moving in opposite directions on a conveyor belt. The toys are yellow in color and are placed in a black box. The video also shows a close-up of the toys.", "gt-answer": "A. moving in opposite directions on a conveyor belt", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the two rows of duck toys are moving in opposite directions on a conveyor belt.", "chatgpt-answer": "A. moving in opposite directions on a conveyor belt", "video-llm-prediction": "The video showcases a conveyor belt with two rows of duck toys moving in opposite directions. The toys are yellow in color and are placed on a black background. The video captures the movement of the toys as they move along the conveyor belt. The video also shows a close-up of the toys, highlighting their unique design and features. Overall, the video provides a visually appealing and engaging experience for the viewers.", "gt-answer": "A. moving in opposite directions on a conveyor belt", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description states that the ducks on the conveyor belt are moving at a normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video shows a conveyor belt with yellow rubber ducks moving along it. The ducks are moving at a normal speed, but one of them is moving at a super fast speed. The video also shows a box with a yellow rubber duck in it.", "gt-answer": "A. normal speed", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the ducks are moving at different speeds along the conveyor belt. Since \"super fast speed\" and \"slow speed\" are extreme options, it is more likely that the conveyor belt is moving at a normal speed.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video showcases a conveyor belt with yellow rubber ducks moving along it. The ducks are seen in various positions, including sitting and standing, and are moving at different speeds. The video captures the movement of the ducks as they continue to move along the conveyor belt.", "gt-answer": "A. normal speed", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ducks on the conveyor belt are moving at a normal speed until they reach the end where they stop. This indicates that the speed of the conveyor belt is also normal.", "chatgpt-answer": "A. normal speed", "video-llm-prediction": "The video shows a conveyor belt with yellow rubber ducks moving along it. The ducks are moving at a normal speed until they reach the end of the conveyor belt where they stop.", "gt-answer": "A. normal speed", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ducks are moving at different speeds on the conveyor belt. However, it does not provide specific information about the speed of the conveyor belt.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a conveyor belt with yellow rubber ducks moving along it. The ducks are seen in different positions, including sitting and standing, and are moving at different speeds. The video captures the playful and whimsical nature of the scene, with the ducks seemingly enjoying their time on the conveyor belt. The video is a fun and lighthearted watch, and the viewer can appreciate the attention to detail in the depiction of the ducks' movements.", "gt-answer": "A. normal speed", "rating": 0 } ] }, "1024867412": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the dog is driving a car, smiling, and waving at the camera.", "chatgpt-answer": "B. driving a car", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is seen smiling and waving at the camera while driving. The video ends with the dog driving the car.", "gt-answer": "B. driving a car", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the dog is seen driving a car while wearing sunglasses. It also mentions that the dog is eating and sleeping in the car.", "chatgpt-answer": "B. driving a car", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is also seen eating and sleeping in the car.", "gt-answer": "B. driving a car", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the dog is driving a car while wearing sunglasses, as well as eating and sleeping in the car.", "chatgpt-answer": "B. driving a car", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is also seen eating and sleeping in the car.", "gt-answer": "B. driving a car", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the dog is seen driving a car while wearing sunglasses. It also mentions that the dog is seen eating and sleeping in the car.", "chatgpt-answer": "B. driving a car", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is also seen eating and sleeping in the car.", "gt-answer": "B. driving a car", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description clearly states that the dog is seen taking a left turn, going straight, taking a right turn, and going backward. This indicates that the car is driving in multiple directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is seen taking a left turn, going straight, taking a right turn, and going backward. The video showcases the dog's ability to drive a car while wearing sunglasses.", "gt-answer": "C. Taking a right turn", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the dog in the car is seen taking a left turn, going straight, and taking a right turn. This indicates that the car is driving in different directions throughout the video.", "chatgpt-answer": "A. Taking a left turn, B. Going straight, C. Taking a right turn", "video-llm-prediction": "A dog wearing sunglasses is seen driving a car on a street. The dog is seen taking a left turn, going straight, and taking a right turn. The video captures the dog's playful and adventurous spirit as it enjoys the ride.", "gt-answer": "C. Taking a right turn", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the dog is driving the car in different directions, including going backward.", "chatgpt-answer": "D. Going backward", "video-llm-prediction": "A dog is seen driving a car in the video. The dog is wearing sunglasses and a hat, and is seen driving the car in different directions. The video shows the dog driving in a straight line, taking a left turn, and going backward. The video also shows the dog smiling and waving at the camera.", "gt-answer": "C. Taking a right turn", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the dog is seen taking a left turn, going straight, taking a right turn, and going backward.", "chatgpt-answer": "D. Going backward", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is seen taking a left turn, going straight, taking a right turn, and going backward. The video captures the dog's playful and adventurous spirit as it enjoys the ride.", "gt-answer": "C. Taking a right turn", "rating": 0 } ] }, "1076877854": { "action": [ { "chatgpt-reasoning": "The video description explicitly mentions that the robots are caring for seedlings, watering plants, harvesting crops, and plowing the soil.", "chatgpt-answer": "A. caring for seedlings, B. watering plants, C. harvesting crops, D. plowing the soil", "video-llm-prediction": "The video showcases a group of robots working together to care for seedlings in a field. The robots are seen watering the plants and tending to them with precision. The video also highlights the robots' ability to harvest crops and plow the soil, showcasing their versatility and efficiency.", "gt-answer": "A. caring for seedlings", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the robots are caring for seedlings and watering the plants.", "chatgpt-answer": "A. caring for seedlings", "video-llm-prediction": "The video showcases a group of robots working together to care for seedlings in a field. The robots are seen watering the plants and tending to them with precision. The video highlights the efficiency and effectiveness of the robots in their task, making it clear that they are capable of handling such responsibilities. The video is a testament to the advancements in technology and how it can be used to improve agriculture.", "gt-answer": "A. caring for seedlings", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the robots are caring for seedlings, watering plants, harvesting crops, and plowing the soil.", "chatgpt-answer": "A. caring for seedlings, B. watering plants, C. harvesting crops, D. plowing the soil", "video-llm-prediction": "The video showcases a group of robots caring for seedlings in a greenhouse. The robots are seen watering the plants and tending to them with precision. The video also highlights the robots' ability to harvest crops and plow the soil, showcasing their versatility and efficiency in agricultural tasks.", "gt-answer": "A. caring for seedlings", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the robots are working together to care for seedlings in a greenhouse. It also mentions that they are seen watering the plants, harvesting crops, and plowing the soil.", "chatgpt-answer": "A. caring for seedlings, B. watering plants, C. harvesting crops, D. plowing the soil", "video-llm-prediction": "The video showcases a group of robots working together to care for seedlings in a greenhouse. The robots are seen watering the plants, harvesting crops, and plowing the soil. The video highlights the efficiency and precision of the robots in their work.", "gt-answer": "A. caring for seedlings", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "Since the camera is panning around the field and then panning back to the group of robotic arms, it implies that the camera is stationary and the closest robotic arm is moving relative to the camera's point of view. From the description, we cannot determine the exact direction in relation to the camera's point of view (e.g., left or right), so we cannot choose A or D. Also, there is no mention of the direction of movement of the closest robotic arm, so we cannot choose B or C.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of robotic arms working together to plant seeds in a field. The camera pans around the field, showing the different arms working in unison to plant the seeds. The video ends with the camera panning back to the group of robotic arms.", "gt-answer": "A. To the right side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the robotic arm is moving in different directions, including towards the camera and away from it. Since the question asks for the direction closest to the camera's point of view, the correct answer would be \"Towards the camera.\"", "chatgpt-answer": "B. Towards the camera", "video-llm-prediction": "The video showcases a robotic arm that is seen moving around a field of plants. The arm is seen moving in different directions, including towards the camera and away from it. The arm is also seen moving towards the right side of the screen. The video provides a glimpse into the world of robotics and how it can be used in agriculture. The use of robotics in agriculture can help increase efficiency and productivity in farming. The video highlights the importance of using technology to improve agriculture and make it more sustainable. The robotic arm is seen moving around the field of plants, indicating that", "gt-answer": "A. To the right side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the robotic arm moves towards the camera and then away from it. This indicates that the closest robotic arm is moving towards the camera.", "chatgpt-answer": "B. Towards the camera", "video-llm-prediction": "A robotic arm is shown in a field of plants. It moves towards the camera and then away from it.", "gt-answer": "A. To the right side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description states that one arm is moving towards the camera and the other arm is moving away from the camera. This means that the closest robotic arm is moving towards the camera.", "chatgpt-answer": "B. Towards the camera", "video-llm-prediction": "A robotic arm is seen moving around a field of plants, with one arm moving towards the camera and the other arm moving away from the camera.", "gt-answer": "A. To the right side of the screen", "rating": 0 } ] }, "1104673225": { "action": [ { "chatgpt-reasoning": "Based on the video description, the woman is seen sitting on a couch and eating a salad. Then she wraps up the salad and throws it away. Later, she is seen making the salad. Therefore, the correct answer is C. eating salad.", "chatgpt-answer": "C. eating salad", "video-llm-prediction": "A woman is seen sitting on a couch and eating a salad. She wraps up the salad and throws it away. Later, she is seen making the salad.", "gt-answer": "C. eating salad", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is holding a bowl of salad and proceeds to eat the salad. This indicates that she is eating salad.", "chatgpt-answer": "C. eating salad", "video-llm-prediction": "A woman is seen sitting on a couch, holding a bowl of salad. She then proceeds to eat the salad while looking off into the distance. The video seems to be focused on the woman and her actions.", "gt-answer": "C. eating salad", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is sitting on a couch, eating a salad, wrapping up the salad, throwing it away, and later making the salad. This indicates that the woman is doing multiple actions including eating salad, wrapping up salad, throwing away salad, and making salad.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen sitting on a couch and eating a salad. She wraps up the salad and throws it away. Later, she is seen making the salad.", "gt-answer": "C. eating salad", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is sitting on a couch and eating a salad. It also states that she wraps up the salad and throws it away. Therefore, the correct answer is that the woman is both eating salad and throwing away salad.", "chatgpt-answer": "C. eating salad", "video-llm-prediction": "A woman is seen sitting on a couch and eating a salad. She wraps up the salad and throws it away.", "gt-answer": "C. eating salad", "rating": 1 } ] }, "1100468035": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans to the left, pans to the right, and so on. This indicates that the camera is moving horizontally.", "chatgpt-answer": "D. panning left", "video-llm-prediction": "The video starts with a blue screen displaying the title of the video. Then, the camera pans to the left and zooms in on the left side of the room. The camera then pans to the right and zooms out on the right side of the room. The camera then pans to the left and zooms out on the left side of the room. Finally, the camera pans to the right and zooms out on the right side of the room.", "gt-answer": "B. zooming forward", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any specific information about the direction of the camera in the video. It only describes the various elements present in the video, such as the blue-lit room, rows of servers, and the blue-lit hallway. Without further details about the camera movement, it is impossible to determine the direction of the camera.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a blue-lit room with rows of servers and a blue-lit hallway with rows of servers. The video also features a blue-lit room with a blue-lit hallway.", "gt-answer": "B. zooming forward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera is panning left and right, capturing the entire room and hallway.", "chatgpt-answer": "D. panning left", "video-llm-prediction": "The video showcases a blue-lit room with a row of servers and a blue-lit hallway with a row of doors. The camera pans left and right, capturing the entire room and hallway.", "gt-answer": "B. zooming forward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans left and right, then zooms forward. This indicates that the camera is moving in different directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a blue-lit hallway with a row of doors on the right side. The camera pans left and right, revealing the blue-lit hallway. The camera then zooms forward, revealing the entire video.", "gt-answer": "B. zooming forward", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly states that the door is gradually opening.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video showcases a blue-lit hallway with a door that gradually opens.", "gt-answer": "C. gradually opening", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the door gradually opens and then closes. This implies that the initial state of the door is closed, it then opens, and finally closes again.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video showcases a door that gradually opens, revealing a room with a blue light. The door then closes, and the video ends.", "gt-answer": "C. gradually opening", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the door is gradually opening and then closing. This eliminates option A since the door is not remaining closed. The correct answer is C because the door is initially closed and then gradually opening before closing again.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video shows a door gradually opening and then closing.", "gt-answer": "C. gradually opening", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the door is gradually opening.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video showcases a door that gradually opens, revealing a room with a blue light. The door then closes, and the video ends.", "gt-answer": "C. gradually opening", "rating": 1 } ] }, "315784": { "speed": [ { "chatgpt-reasoning": "The video description states that the speedometer in the center is initially stationary and then shown moving slower and finally moving faster. This means that in relation to the speedometer on the left, the speedometer in the center appears to be moving slower.", "chatgpt-answer": "B. moving slower", "video-llm-prediction": "The video shows a speedometer in the center of the screen, which is stationary. The speedometer is then shown moving slower, and finally moving faster. The video does not provide any additional information about the speedometer.", "gt-answer": "C. moving faster", "rating": 0 }, { "chatgpt-reasoning": "According to the video description, the first speed displayed on the center speedometer is stationary. This means that in relation to the speedometer on the left, the center speedometer appears to be stationary.", "chatgpt-answer": "A. stationary", "video-llm-prediction": "The video showcases a speedometer in the center of the screen, which displays different speeds. The first speed displayed is stationary, while the second speed displayed is moving slower. The third speed displayed is moving faster.", "gt-answer": "C. moving faster", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the speedometer in the center displays different speeds, including stationary, moving slower, and moving faster. Therefore, it can be inferred that the speedometer in the center appears different from the speedometer on the left.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A speedometer in the center displays different speeds, including stationary, moving slower, and moving faster.", "gt-answer": "C. moving faster", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the first speed displayed on the center speedometer is stationary, while the second speed is slower and the third speed is faster. Therefore, the speedometer in the center appears to be displaying different speeds.", "chatgpt-answer": "B. moving slower.", "video-llm-prediction": "The video showcases a speedometer in the center of the screen, which displays different speeds. The first speed shown is stationary, while the second speed is moving slower, and the third speed is moving faster. The video provides a visual representation of the speedometer's different speeds, making it easy to understand the concept.", "gt-answer": "C. moving faster", "rating": 0 } ] }, "3411806181": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is seen recharging an electric vehicle with a portable charger and then moves on to cleaning the car. After cleaning, the person starts repairing the car with a toolbox. Therefore, the correct answer is C. repairing an electric vehicle.", "chatgpt-answer": "C. repairing an electric vehicle", "video-llm-prediction": "A man is seen recharging an electric vehicle with a portable charger. He connects the charger to the car battery and starts the recharging process. The man then moves to the front of the car and opens the trunk. He takes out a vacuum and starts cleaning the car. After cleaning, he moves to the back of the car and opens the trunk again. This time, he takes out a toolbox and starts repairing the car. The man works on the car for a while before closing the trunk and walking away.", "gt-answer": "A. recharging an electric vehicle", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen recharging an electric vehicle, cleaning the electric vehicle, and repairing the electric vehicle, all with the same charger.", "chatgpt-answer": "D. recharging, cleaning, and repairing an electric vehicle", "video-llm-prediction": "A man is seen recharging an electric vehicle with a portable charger. He then uses the same charger to clean the electric vehicle. Later, he is seen repairing the electric vehicle with the same charger.", "gt-answer": "A. recharging an electric vehicle", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is recharging an electric vehicle with a charger.", "chatgpt-answer": "A. recharging an electric vehicle", "video-llm-prediction": "A man is seen recharging an electric vehicle with a charger.", "gt-answer": "A. recharging an electric vehicle", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the person is recharging an electric vehicle by plugging it into a charging station. It also mentions that the person proceeds to clean the vehicle before driving away.", "chatgpt-answer": "A. recharging an electric vehicle", "video-llm-prediction": "A man is seen recharging an electric vehicle by plugging it into a charging station. He then proceeds to clean the vehicle before driving away.", "gt-answer": "A. recharging an electric vehicle", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description states that the person first plugs the charging gun into the car, then moves it parallel to the car, and finally plugs it back into the car. This indicates that the person is moving the charging gun parallel to the car.", "chatgpt-answer": "B. Parallel to the car", "video-llm-prediction": "A man is seen plugging a charging gun into a car. He then unplugs the charging gun and moves it parallel to the car. Finally, he plugs the charging gun back into the car.", "gt-answer": "C. Towards the car", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is holding the charging gun and moving it parallel to the car.", "chatgpt-answer": "B. Parallel to the car", "video-llm-prediction": "A man is seen plugging a charging gun into a car while another man is holding the charging gun. The man holding the charging gun then moves the charging gun parallel to the car. The video then shows the man plugging the charging gun into the car.", "gt-answer": "C. Towards the car", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person moves the charging gun parallel to the car.", "chatgpt-answer": "B. Parallel to the car", "video-llm-prediction": "A man is seen plugging a charging gun into a car. He then unplugs the charging gun from the car and moves it parallel to the car. Finally, he plugs the charging gun back into the car.", "gt-answer": "C. Towards the car", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the person is moving the charging gun parallel to the car.", "chatgpt-answer": "B. Parallel to the car", "video-llm-prediction": "A man is seen plugging a charging gun into a car, and then unplugging it. The charging gun is then seen moving parallel to the car.", "gt-answer": "C. Towards the car", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video, so we cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen charging his electric car in a parking lot. He uses a portable charger to charge his car. The video shows the process of charging the car and the man's actions.", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video is shot in a normal speed, allowing the viewer to see the details of the process.", "chatgpt-answer": "C. normal speed", "video-llm-prediction": "A man is seen plugging a charger into a car battery while another man is standing next to him. The man then proceeds to plug the charger into his own car battery. The video seems to be showcasing the process of charging a car battery using a charger. The video is shot in a time-lapse format, which allows the viewer to see the entire process in a shorter amount of time. The video is shot in a normal speed, which allows the viewer to see the details of the process. Overall, the video provides a clear and concise demonstration of how to charge a car", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. It only describes the actions of a man charging his electric car. Therefore, we cannot determine the speed of the video based on the information provided.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen charging his electric car in a parking lot. He uses a portable charger to connect to his car and then uses a regular charger to charge the car. The video shows the process of charging the car and the man's actions throughout the process.", "gt-answer": "B. slow motion", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. Therefore, we cannot determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A man is seen plugging a charger into a car battery while another man is standing next to him. The man then uses the charger to charge the car battery.", "gt-answer": "B. slow motion", "rating": 0 } ] }, "1043054206": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the yellow car is driving at different speeds, including driving faster than other cars, driving at the same speed as other cars, and driving slower than other cars. This means that the correct answer should be an option that describes the car's speed in comparison to other cars.", "chatgpt-answer": "C. Driving at the same speed as other cars.", "video-llm-prediction": "The video shows a yellow car driving on a highway with other cars. The car is seen driving at different speeds, including stopped, driving faster than other cars, driving at the same speed as other cars, and driving slower than other cars. The video also shows the car driving through a canyon and a tunnel.", "gt-answer": "B. Driving faster than other cars", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the yellow car is seen driving at different speeds, including being stopped, driving faster than other cars, and driving at the same speed as other cars.", "chatgpt-answer": "B. Driving faster than other cars", "video-llm-prediction": "The video shows a yellow car driving on a highway with other cars. The car is seen driving at different speeds, including stopped. The video also shows the car driving faster than other cars and at the same speed as other cars.", "gt-answer": "B. Driving faster than other cars", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the yellow car is seen driving at the same speed as other cars, faster than other cars, and slower than other cars.", "chatgpt-answer": "C. Driving at the same speed as other cars", "video-llm-prediction": "A yellow car is seen driving on a highway with other cars. The car is seen driving at the same speed as other cars, and then it is seen driving faster than other cars. The car is also seen driving slower than other cars.", "gt-answer": "B. Driving faster than other cars", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the yellow car is initially stopped, but later it is seen driving at the same speed as the other cars and also driving slower than them. This means that the correct answer is D. Driving slower than other cars, as it mentions both scenarios described in the video.", "chatgpt-answer": "D. Driving slower than other cars", "video-llm-prediction": "The yellow car is seen driving on a highway with other cars. It is initially stopped, but later, it is seen driving faster than the other cars. The video captures the car driving at the same speed as the other cars and also driving slower than them.", "gt-answer": "B. Driving faster than other cars", "rating": 0 } ] }, "1096238125": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that the man and woman are doing sit-ups together in a gym.", "chatgpt-answer": "A. doing sit-ups", "video-llm-prediction": "The video shows a man and woman doing sit-ups together in a gym. They are both wearing workout clothes and appear to be in good physical shape. The woman is wearing a ponytail and the man is wearing a beard. The gym is well-lit and has several pieces of equipment visible in the background. The video ends with the woman finishing her sit-ups and the man clapping.", "gt-answer": "C. lifting weights", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man and woman are seen doing sit-ups, jumping rope, lifting weights, and doing push-ups.", "chatgpt-answer": "A. doing sit-ups, B. jumping rope, C. lifting weights, D. doing push-ups", "video-llm-prediction": "The video shows a man and woman performing various exercises in a gym. They are seen doing sit-ups, jumping rope, lifting weights, and doing push-ups. The video emphasizes the importance of physical fitness and the benefits of incorporating exercise into one's daily routine.", "gt-answer": "C. lifting weights", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man and woman are doing sit-ups in a gym.", "chatgpt-answer": "A. doing sit-ups", "video-llm-prediction": "The video shows a man and woman doing sit-ups in a gym.", "gt-answer": "C. lifting weights", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the man and woman are doing sit-ups in a gym. Additionally, it describes their attire, the presence of a mat for support, their focus on their workout, and the absence of any conversation between them, all of which align with the activity of doing sit-ups.", "chatgpt-answer": "A. doing sit-ups", "video-llm-prediction": "The man and woman are seen doing sit-ups in a gym. They are dressed in workout clothes and are using a mat for support. The man is wearing a grey shirt and the woman is wearing a blue shirt. The gym is well-lit and has a variety of equipment in the background. The man and woman are both focused on their workout and are not speaking to each other.", "gt-answer": "C. lifting weights", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description mentions that the man lifts the barbell while the woman continues to lift it. It doesn't explicitly mention the speed at which they are lifting the kettlebell.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman performing a weightlifting exercise in a gym. The woman is seen lifting a barbell while the man is standing next to her. The man then lifts the barbell while the woman continues to lift it. The video emphasizes the importance of proper form and technique when lifting weights.", "gt-answer": "A. At roughly the same speed as the woman", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is lifting a barbell while the man is standing next to her, implying that they are performing the exercise at the same time. However, the video does not provide any details about the speed or pace at which they are lifting the barbell. Therefore, there is not enough information to determine how the man is lifting the kettlebell compared to the woman.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a man and a woman performing a weightlifting exercise in a gym. The woman is seen lifting a barbell while the man is standing next to her. The video emphasizes the importance of proper form and technique when lifting weights.", "gt-answer": "A. At roughly the same speed as the woman", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man and woman are both seen lifting weights, but it does not provide any information about their relative speeds. Therefore, we cannot determine how the man is lifting the kettlebell compared to the woman based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman performing a weightlifting exercise. The woman is seen lifting a barbell while the man is standing next to her. The video also shows the man lifting a dumbbell while the woman is standing next to him. The video ends with the man and woman standing next to each other.", "gt-answer": "A. At roughly the same speed as the woman", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man and woman are both performing squats in the gym. However, it does not provide any information about the speed at which they are lifting the kettlebell. Therefore, based on the given information, we cannot determine how the man is lifting the kettlebell compared to the woman.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman performing squats in a gym. The woman is wearing a blue shirt and black tights, while the man is wearing a grey shirt and black shorts. The woman is seen performing squats alone, while the man is doing squats with the woman. The video also shows the man doing squats alone.", "gt-answer": "A. At roughly the same speed as the woman", "rating": 0 } ] }, "1103088481": { "action": [ { "chatgpt-reasoning": "The video description mentions that the man is seen selecting and purchasing vegetables, putting them into his cart, and then pushing the cart to the cash register. Therefore, it can be inferred that he is buying vegetables.", "chatgpt-answer": "D. buying vegetables", "video-llm-prediction": "A man is seen pushing a cart through a grocery store, selecting and purchasing vegetables. He is shown putting the vegetables into his cart and then pushing the cart to the cash register to make his purchase.", "gt-answer": "D. buying vegetables", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man is picking up vegetables and putting them in his cart. Then, he checks out and leaves the store. This indicates that the person is buying vegetables.", "chatgpt-answer": "D. buying vegetables", "video-llm-prediction": "A man is seen pushing a cart through a grocery store, picking up vegetables and putting them in his cart. He then proceeds to check out and leaves the store.", "gt-answer": "D. buying vegetables", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen shopping in a grocery store, selecting and purchasing vegetables. Therefore, the correct answer is D. buying vegetables.", "chatgpt-answer": "D. buying vegetables", "video-llm-prediction": "A man is seen shopping in a grocery store, pushing a cart down the aisle. He is seen selecting and purchasing vegetables, including tomatoes and apples. The video showcases the man's shopping experience in the grocery store.", "gt-answer": "D. buying vegetables", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is \"selecting and purchasing vegetables\" in a grocery store. This indicates that he is buying vegetables.", "chatgpt-answer": "D. buying vegetables", "video-llm-prediction": "A man is seen pushing a cart through a grocery store, selecting and purchasing vegetables. He is seen pushing the cart through the store, selecting and purchasing vegetables.", "gt-answer": "D. buying vegetables", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description clearly states the order of events as follows:", "chatgpt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "video-llm-prediction": "A man is seen pushing a shopping cart down an aisle in a grocery store. He is seen placing green vegetables into the cart and then placing a black vegetables into the cart. He then continues to push the cart down the aisle and places a yellow vegetables into the cart. Finally, he places a red vegetables into the cart.", "gt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man first picks up a green vegetable and places it into the cart, then picks up a black vegetable and places it into the cart. The process is repeated with a yellow vegetable and a red vegetable.", "chatgpt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "video-llm-prediction": "A man is seen pushing a shopping cart down an aisle, picking up a green vegetable and placing it into the cart. He then picks up a black vegetable and places it into the cart. The man repeats this process with a yellow vegetable and a red vegetable.", "gt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the person first picks up a green vegetable and places it in the cart, then picks up a black vegetable and places it in the cart. They repeat this process with a yellow vegetable and a red vegetable. Therefore, the correct order of events in the video is placing a green vegetable into the trolley and then placing a black vegetable into the trolley.", "chatgpt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "video-llm-prediction": "A person is seen shopping in a supermarket, pushing a shopping cart down the aisle. They pick up a green vegetable and place it in the cart, then pick up a black vegetable and place it in the cart. They repeat this process with a yellow vegetable and a red vegetable.", "gt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the person first places green vegetables into the cart, then places black vegetables into the cart, followed by placing yellow vegetables and finally red vegetables.", "chatgpt-answer": "C. Placing a green vegetables into the trolley, followed by placing a yellow vegetables into the trolley", "video-llm-prediction": "A person is seen pushing a shopping cart down an aisle in a grocery store. They are seen placing green vegetables into the cart and then placing a black vegetables into the cart. The person then continues to place vegetables into the cart, including a yellow vegetables and a red vegetables.", "gt-answer": "A. Placing a green vegetables into the trolley and then placing a black vegetables into the trolley", "rating": 0 } ] }, "1055981522": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the white cubes are spinning and turning into triangles. Then, the cubes turn into spheres and begin to melt. Therefore, the correct answer is B. turning into triangles.", "chatgpt-answer": "B. turning into triangles", "video-llm-prediction": "The video shows a group of white cubes that are spinning and turning into triangles. The cubes then turn into spheres and begin to melt.", "gt-answer": "C. turning into spheres", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the white cube is transformed into a white ball. There is no mention of the cubes disappearing, turning into triangles, or melting. The correct answer is that the white cubes are turning into spheres.", "chatgpt-answer": "C. turning into spheres", "video-llm-prediction": "The video features a white cube that is shown in various positions and angles. The cube is then transformed into a white ball and begins to spin rapidly. The video ends with the white ball exploding.", "gt-answer": "C. turning into spheres", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the white cubes disappear, turn into triangles, and then turn into spheres. It also mentions that the video ends with the cubes melting.", "chatgpt-answer": "D. melting", "video-llm-prediction": "A video of white cubes that disappear, turn into triangles, and then turn into spheres. The video ends with the cubes melting.", "gt-answer": "C. turning into spheres", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the white cubes are shown melting and turning into triangles, then turning into spheres and melting again. Therefore, the correct answer is D. melting.", "chatgpt-answer": "D. melting", "video-llm-prediction": "The video features a group of white cubes that are shown melting and turning into triangles. The cubes are then shown turning into spheres and melting again. The video ends with the cubes turning into triangles once more.", "gt-answer": "C. turning into spheres", "rating": 0 } ] }, "1061017846": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the boat is seen moving at different speeds, with some shots showing it moving faster than others. This implies that the speed of the boat on the top of the screen may be different from the speed of the boat on the bottom of the screen.", "chatgpt-answer": "It cannot be determined based on the given information.", "video-llm-prediction": "The video shows a boat moving through the water, with the camera capturing the boat from different angles. The boat is seen moving at different speeds, with some shots showing it moving faster than others. The video also includes a shot of the boat from a distance, with the water and sky in the background. Overall, the video provides a detailed view of the boat's movement and its surroundings.", "gt-answer": "C. travels at the same speed as the boat on the bottom of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the boat is seen moving at different speeds. However, it does not specifically state the speed of the boat on the top of the screen in relation to the boat on the bottom of the screen or whether they travel at the same speed. Therefore, there is not enough information to determine the correct answer.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a boat moving through the water, with the camera capturing the boat from different angles. The boat is seen moving at different speeds, with some shots showing it moving faster than others. The video also includes a shot of the boat from a distance, with the water and sky in the background. Overall, the video provides a detailed view of the boat's movement and its surroundings.", "gt-answer": "C. travels at the same speed as the boat on the bottom of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the boat is seen moving at different speeds, with some shots showing it moving faster than others. Therefore, the speed of the boat on the top of the screen could be either slower or faster than the boat on the bottom of the screen, depending on the specific shot being shown.", "chatgpt-answer": "Either A. slower than the boat on the bottom of the screen or B. faster than the boat on the bottom of the screen.", "video-llm-prediction": "A boat is seen traveling on the water, with the camera capturing its movement from different angles. The boat is seen moving at different speeds, with some shots showing it moving faster than others. The video provides a detailed view of the boat's movement on the water, with the camera capturing its every movement.", "gt-answer": "C. travels at the same speed as the boat on the bottom of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the boat on the top of the screen is seen moving at a slower pace than the boat on the bottom of the screen.", "chatgpt-answer": "A. slower than the boat on the bottom of the screen", "video-llm-prediction": "The video showcases a boat traveling at a slower speed than another boat on the water. The boat on the top of the screen is seen moving at a slower pace than the boat on the bottom of the screen. The video captures the serene beauty of the water and the tranquility of the surroundings.", "gt-answer": "C. travels at the same speed as the boat on the bottom of the screen", "rating": 0 } ] }, "1097341567": { "order": [ { "chatgpt-reasoning": "The video description mentions that the video starts with a bar chart, followed by an arrow. It then shows the arrow again before ending with the bar chart. This indicates that the bars appear first and then the arrow appears.", "chatgpt-answer": "B. The bars appear, then the arrow appears", "video-llm-prediction": "The video starts with a bar chart, which is then followed by an arrow. The arrow is shown again, and the video ends with the bar chart. The video seems to be related to the bar chart, and the arrow could be a symbol of progress or movement. The video could be related to a business or financial context, where the bar chart represents data or performance metrics, and the arrow represents growth or improvement. The video could be used for marketing or promotional purposes, to showcase the progress or success of a product or service.", "gt-answer": "B. The bars appear, then the arrow appears", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, it states that the video shows a bar chart with a green arrow pointing upwards, and also includes a white arrow pointing downwards. This implies that both the arrows and the bars appear in the video.", "chatgpt-answer": "C. They both appear at the same time", "video-llm-prediction": "The video shows a bar chart with a green arrow pointing upwards. The video also includes a white arrow pointing downwards. The video is about the bar chart and its significance.", "gt-answer": "B. The bars appear, then the arrow appears", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the video shows a bar chart followed by an arrow pointing upwards. This implies that the bars appear first and then the arrow appears.", "chatgpt-answer": "B. The bars appear, then the arrow appears", "video-llm-prediction": "A bar chart is shown, followed by an arrow pointing upwards. The video then shows a graph with a bar chart.", "gt-answer": "B. The bars appear, then the arrow appears", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically mentions that the arrow is shown before the second bar chart. This indicates that the arrow appears first, followed by the bars.", "chatgpt-answer": "A. The arrow appears, then the bars appear", "video-llm-prediction": "The video features a bar chart, which is shown before an arrow. The arrow is then followed by another bar chart. The video ends with the bar chart being shown again.", "gt-answer": "B. The bars appear, then the arrow appears", "rating": 0 } ] }, "1056433484": { "direction": [ { "chatgpt-reasoning": "The video description explicitly states that the subject is the Earth and the direction is counter-clockwise.", "chatgpt-answer": "A. Counter-clockwise", "video-llm-prediction": "A video shows a black and white screen with a black dot moving around in a circle. The dot is seen moving in different directions, including counter-clockwise, clockwise, and upwards. The video also includes a piece of information that states the subject is the earth and the direction is counter-clockwise.", "gt-answer": "A. Counter-clockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the Earth is spinning in different directions, including counter-clockwise and clockwise, but it does not mention anything about the Earth's motion around the Sun. Therefore, we cannot determine the direction of the Earth's motion around the Sun based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the earth spinning in different directions, including counter-clockwise, clockwise, and upwards. The video also features a black ball moving around the screen and a black and white screen with a black ball on it.", "gt-answer": "A. Counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the Earth is spinning in different directions, but it does not provide any information about the Earth's motion around the Sun. Therefore, we cannot determine the direction of the Earth's motion around the Sun based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows the earth spinning in different directions, including counter-clockwise, clockwise, and upwards. The information provided is not consistent with the video content.", "gt-answer": "A. Counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the Earth rotates in a clockwise direction. However, it does not provide any information about the Earth's motion around the Sun or its direction.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a black ball moving in a net of points, while the earth rotates in the background. The ball moves in a counter-clockwise direction, and the earth rotates in a clockwise direction. The video also shows the earth moving upwards.", "gt-answer": "A. Counter-clockwise", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description states that the earth is shown moving faster than the sun, slower than the sun, and at the same speed as the sun. Since the information presented is not consistent, it is not possible to determine the actual speed of the earth's rotation compared to the sun.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows the earth moving faster than the sun, slower than the sun, and at the same speed as the sun. The information presented is not consistent with the video.", "gt-answer": "A. Faster than the sun", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the earth is moving at different speeds, with one instance showing it moving faster than the sun. This implies that the speed of the earth's rotation is faster than the sun.", "chatgpt-answer": "A. Faster than the sun", "video-llm-prediction": "The video showcases the earth moving at different speeds, with one instance showing it moving faster than the sun. The video also features a black ball moving in front of the earth, and a black and white screen with a black ball on it.", "gt-answer": "A. Faster than the sun", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the earth is moving faster than the sun.", "chatgpt-answer": "A. Faster than the sun", "video-llm-prediction": "The video shows the earth moving faster than the sun.", "gt-answer": "A. Faster than the sun", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the earth is shown moving at different speeds compared to the sun. Specifically, it states that there are instances where the earth is shown moving faster than the sun and slower than the sun.", "chatgpt-answer": "C. The same as the sun", "video-llm-prediction": "The video showcases the earth moving at different speeds, with one instance showing it moving faster than the sun and another showing it moving slower than the sun. The video also features a black ball moving around the screen, which could be a representation of the earth's movement. The video's purpose is to highlight the earth's movement and its significance in the universe.", "gt-answer": "A. Faster than the sun", "rating": 0 } ] }, "1073914229": { "direction": [ { "chatgpt-reasoning": "The video description explicitly states that the two trains are traveling in opposite directions on the same track.", "chatgpt-answer": "C. in opposite directions", "video-llm-prediction": "The video shows two trains traveling in opposite directions on the same track. The first train is red and white, while the second train is silver and red. The video also shows a green field with trees in the background.", "gt-answer": "C. in opposite directions", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the two trains are traveling in opposite directions.", "chatgpt-answer": "C. in opposite directions", "video-llm-prediction": "The video showcases two trains traveling in opposite directions on parallel tracks, surrounded by lush green fields and trees. The serene landscape and the smooth movement of the trains create a calming and picturesque scene.", "gt-answer": "C. in opposite directions", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the two trains are moving in opposite directions on the same track.", "chatgpt-answer": "C. in opposite directions", "video-llm-prediction": "The video shows two trains traveling in opposite directions on the same track. The first train is seen moving in the same direction as the information A, while the second train is moving in the opposite direction as the information B. The video captures the movement of the trains as they pass each other on the track.", "gt-answer": "C. in opposite directions", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the train is moving in the same direction as the trees.", "chatgpt-answer": "A. in the same direction", "video-llm-prediction": "A train is seen traveling down the tracks, passing by a field of green trees. The train is moving in the same direction as the trees.", "gt-answer": "C. in opposite directions", "rating": 0 } ] }, "1099360359": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the train in the foreground (closer to the screen) is moving faster than the one in the background. Therefore, the correct answer is A. The train closer to the screen.", "chatgpt-answer": "A. The train closer to the screen", "video-llm-prediction": "The video showcases two trains, one closer to the camera and the other further away. The train in the foreground is moving faster than the one in the background. The video emphasizes the contrast between the two trains and their respective speeds.", "gt-answer": "D. The train further away from the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that \"The train in the foreground is moving faster than the one in the background.\" This indicates that the train closer to the screen is the one driving faster.", "chatgpt-answer": "A. The train closer to the screen", "video-llm-prediction": "The video showcases two trains, one closer to the camera and the other further away. The train in the foreground is moving faster than the one in the background. The video emphasizes the contrast between the two trains, with the closer train appearing larger and more prominent in the frame. The video captures the movement and speed of the trains, providing a sense of motion and excitement.", "gt-answer": "D. The train further away from the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"The train parked further away is moving faster than the closer train.\"", "chatgpt-answer": "D. The train further away from the screen", "video-llm-prediction": "The video shows a train station with two trains parked on the tracks. One train is parked closer to the camera, while the other is parked further away. The train parked further away is moving faster than the closer train.", "gt-answer": "D. The train further away from the screen", "rating": 1 }, { "chatgpt-reasoning": "The video description states that \"The train in the foreground is moving faster than the one in the background.\"", "chatgpt-answer": "A. The train closer to the screen", "video-llm-prediction": "The video showcases two trains, one closer to the camera and the other further away. The train in the foreground is moving faster than the one in the background. The video captures the essence of the train's motion and the contrast between the two trains.", "gt-answer": "D. The train further away from the screen", "rating": 0 } ] }, "1098970151": { "action": [ { "chatgpt-reasoning": "The video description mentions that the cat is seen licking its paw, waving its paw, and biting its paw. This indicates that the cat is primarily focused on its paw throughout the video.", "chatgpt-answer": "A. licking its paw", "video-llm-prediction": "A cat is seen licking its paw while laying on a bed. The cat then waves its paw and watches it. The cat then bites its paw and licks it.", "gt-answer": "A. licking its paw", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the cat is seen licking its paw, waving its paw, and watching its paw in the video.", "chatgpt-answer": "A. licking its paw", "video-llm-prediction": "A cat is seen licking its paw, waving its paw, and watching its paw in a video.", "gt-answer": "A. licking its paw", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the cat is licking its paw, so option A is the correct answer.", "chatgpt-answer": "A. licking its paw", "video-llm-prediction": "A cat is seen licking its paw while lying on a bed.", "gt-answer": "A. licking its paw", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the cat is seen licking its paw while laying on a bed and then waves its paw and watches it.", "chatgpt-answer": "C. waving its paw", "video-llm-prediction": "A cat is seen licking its paw while laying on a bed. The cat then waves its paw and watches it.", "gt-answer": "A. licking its paw", "rating": 0 } ] }, "1081734740": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the video includes several shots of the leaf, highlighting its texture and color changes. Since the focus is on the texture changes of the leaf, it can be inferred that the texture of the leaf is changing.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the natural process of a leaf changing color from green to yellow. The video starts with a close-up shot of a leaf, and then it shows the leaf turning from green to yellow. The video also includes several shots of the leaf, highlighting its texture and color changes. The video provides a detailed view of the leaf's transformation, making it an excellent resource for anyone interested in the natural process of a leaf changing color.", "gt-answer": "A. It is turning from green to yellow", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the camera captures the leaf's texture and color, highlighting the gradual transformation from green to yellow. This indicates that the texture of the leaf is changing from green to yellow.", "chatgpt-answer": "A. It is turning from green to yellow", "video-llm-prediction": "The video showcases the natural process of a leaf changing from green to yellow. The camera captures the leaf's texture and color, highlighting the gradual transformation from green to yellow. The video emphasizes the beauty and complexity of the natural world, inspiring viewers to appreciate the intricacies of nature.", "gt-answer": "A. It is turning from green to yellow", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the leaf is changing its color from green to yellow and then to white. However, there is no information provided about the texture of the leaf.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the changing colors of a leaf, starting from green to yellow and then to white. The video provides a close-up view of the leaf, highlighting its texture and color changes.", "gt-answer": "A. It is turning from green to yellow", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the leaf is changing colors, starting from green to yellow and then to white. Therefore, the texture of the leaf is turning from green to white.", "chatgpt-answer": "C. It is turning from green to white", "video-llm-prediction": "The video showcases the changing colors of a leaf, starting from green to yellow and then to white. The video emphasizes the beauty of nature and the changing colors of leaves.", "gt-answer": "A. It is turning from green to yellow", "rating": 0 } ] }, "1093719871": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the pink flowers are growing from withered to full blossom and then turning from full blossom to withered. The video also shows the process of the flowers growing taller and falling off petals.", "chatgpt-answer": "C. turning from withered to full blossom", "video-llm-prediction": "The video showcases the process of pink flowers growing from withered to full blossom and then turning from full blossom to withered. The video starts with a close-up shot of pink flowers, and then it transitions to a wider shot of the flowers. The flowers are shown growing taller and turning from withered to full blossom. The video then shows the flowers turning from full blossom to withered. The video ends with a shot of the flowers falling off petals.", "gt-answer": "C. turning from withered to full blossom", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the pink flowers are turning from full blossom to withered. This means that the flowers are going through a process where they lose their petals and become withered.", "chatgpt-answer": "D. turning from full blossom to withered", "video-llm-prediction": "The video showcases the process of pink flowers turning from full blossom to withered. The video starts with a close-up shot of the flowers, and then it transitions to a wider shot of the flowers. The flowers are shown in various stages of blossoming, from full bloom to withered. The video highlights the beauty of the flowers and the process of their life cycle. The video is a great representation of the beauty of nature and the cycle of life.", "gt-answer": "C. turning from withered to full blossom", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the pink flowers are initially withered but later turn into full blossom. This means that the flowers are undergoing a transformation from withered to full blossom.", "chatgpt-answer": "C. turning from withered to full blossom", "video-llm-prediction": "The video showcases a group of pink flowers that are initially withered but later turn into full blossom. The flowers are seen growing taller and turning from withered to full blossom.", "gt-answer": "C. turning from withered to full blossom", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the pink flowers are turning from full blossom to withered.", "chatgpt-answer": "D. turning from full blossom to withered", "video-llm-prediction": "The video showcases the process of pink flowers turning from full blossom to withered. The video starts with a close-up shot of the flowers, and then it transitions to a wider shot of the flowers. The flowers are shown in various stages of blossoming, from full bloom to withered. The video highlights the beauty of the flowers and the process of their life cycle. The video is a great representation of the beauty of nature and the cycle of life.", "gt-answer": "C. turning from withered to full blossom", "rating": 0 } ] }, "1042819039": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the video includes a time-lapse effect, which shows the same scene but at a faster pace.", "chatgpt-answer": "B. time-lapse", "video-llm-prediction": "The video shows a busy intersection with many people crossing the street. The camera captures the bustling scene from various angles, highlighting the movement and energy of the city. The video also includes a time-lapse effect, which shows the same scene but at a faster pace. The camera captures the people crossing the street, the cars driving by, and the sounds of the city. The video ends with a shot of the intersection at night, with the lights of the city illuminating the scene.", "gt-answer": "B. time-lapse", "rating": 1 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the video. It only describes the scene and the movement of people and cars. Therefore, we cannot determine the speed of the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a busy intersection with a large crowd of people walking around. The camera captures the bustling scene from above, and the sound of the crowd can be heard in the background. The camera then pans to the right, revealing a car driving down the street. The car is surrounded by the crowd, and the camera captures the movement of the people around it. The video then pans to the left, revealing a car driving down the street. The car is surrounded by the crowd, and the camera captures the movement of the people around it. The video then pans to the right,", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the video. We can assume that the video is filmed in normal speed, as it captures the movement of the crowd and cars in real-time.", "chatgpt-answer": "C. normal speed", "video-llm-prediction": "A busy intersection with a large crowd of people crossing the street. The camera captures the scene from above, showing the movement of the crowd and the cars driving through the intersection.", "gt-answer": "B. time-lapse", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the video is shot in slow motion, highlighting the movement of people and vehicles.", "chatgpt-answer": "A. slow motion", "video-llm-prediction": "The video captures a busy intersection with people crossing the street. The camera pans around the intersection, showing the bustling activity. The video is shot in slow motion, highlighting the movement of people and vehicles.", "gt-answer": "B. time-lapse", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description clearly states that the street was first filled with vehicles and then with people.", "chatgpt-answer": "C. The street was filled with vehicles, then it was filled with people", "video-llm-prediction": "The video shows a busy street filled with both vehicles and people. The street is first filled with vehicles, and then with people. The video captures the hustle and bustle of the city, with people walking and cars driving. The street is a hub of activity, with people going about their daily routines. The video provides a glimpse into the life of a bustling city, where people and vehicles coexist in a chaotic yet vibrant environment.", "gt-answer": "A. The street was filled with people, then it was filled with vehicles", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the street was first filled with vehicles and then with people. It mentions the movement of both vehicles and people, indicating that the vehicles were present before the people.", "chatgpt-answer": "C. The street was filled with vehicles, then it was filled with people", "video-llm-prediction": "The video captures a busy street filled with both vehicles and people. The street is first filled with vehicles, and then with people. The scene is bustling with activity, and the camera captures the movement of both vehicles and people. The video provides a glimpse into the hustle and bustle of city life, showcasing the constant movement and energy of the urban environment.", "gt-answer": "A. The street was filled with people, then it was filled with vehicles", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"The street is first filled with vehicles, and then with people.\" This implies that the events occurred in the order of vehicles first, followed by people.", "chatgpt-answer": "C. The street was filled with vehicles, then it was filled with people", "video-llm-prediction": "The video shows a busy street filled with people and vehicles. The street is first filled with vehicles, and then with people. The video captures the hustle and bustle of the city, with people walking and vehicles driving. The street is a hub of activity, with people going about their daily lives. The video provides a glimpse into the fast-paced nature of city life, where people and vehicles coexist in a constant state of motion.", "gt-answer": "A. The street was filled with people, then it was filled with vehicles", "rating": 0 }, { "chatgpt-reasoning": "The video starts with the street being empty, and as the camera pans out, we see people walking around and vehicles driving on the street. Therefore, the events occurred in the following order: the street was initially empty, then it was filled with people and vehicles.", "chatgpt-answer": "A. The street was filled with people, then it was filled with vehicles", "video-llm-prediction": "The video captures a busy street filled with both vehicles and people. The street is initially empty, but as the camera pans out, we see people walking around and vehicles driving on the street. The street is bustling with activity, and the camera captures the movement of both people and vehicles. The video provides a glimpse into the daily life of a busy street, showcasing the hustle and bustle of city life.", "gt-answer": "A. The street was filled with people, then it was filled with vehicles", "rating": 1 } ] }, "1093139559": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera starts with zooming in on three men, then pans to the left and pans to the right, showing the entire field.", "chatgpt-answer": "C. Panning right", "video-llm-prediction": "The video starts with three men walking onto a field, and the camera zooms in on them. The men are wearing red jerseys and white shorts, and they seem to be preparing for a game. The camera then pans to the left, showing the entire field. The men are seen walking towards the center of the field, where they start playing soccer. The camera then pans to the right, showing the entire field. The men are seen running around, passing the ball to each other, and trying to score a goal. The game seems to be intense, and the men are putting in", "gt-answer": "A. Zooming into three football players", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans to the left and then pans to the right.", "chatgpt-answer": "C. Panning right", "video-llm-prediction": "The video starts with three men standing on a field, and they are all wearing red shirts. The men are seen walking towards the camera, and they seem to be in a hurry. As they walk, the camera pans to the left, and we can see a large crowd of people sitting in the stands. The men continue to walk towards the camera, and we can see that they are heading towards the stands. The camera then pans to the right, and we can see that the men are now standing in front of the crowd. The men seem to be talking to the crowd, and they are all sm", "gt-answer": "A. Zooming into three football players", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera zooms in on the three football players and then pans left and right to show the entire field. The camera then zooms out to show the entire field.", "chatgpt-answer": "D. Zooming out from three football players", "video-llm-prediction": "Three football players are seen walking onto a field, and the camera zooms in on them. The camera then pans left and right, showing the entire field. The players are seen walking around the field, and the camera zooms out to show the entire field.", "gt-answer": "A. Zooming into three football players", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the players walking onto the field, playing, and then walking off the field. It does not mention any zooming in or out. However, it does mention that the players are seen walking towards the center of the field, indicating a panning motion.", "chatgpt-answer": "B. Panning left", "video-llm-prediction": "The video shows three football players walking onto a field, with a crowd cheering them on. The players are seen walking towards the center of the field, where they begin to play. The video captures the excitement and energy of the game, with the players running up and down the field, passing the ball to each other, and scoring goals. The crowd is seen cheering and clapping throughout the game, adding to the overall atmosphere of excitement and energy. The video ends with the players walking off the field, with the crowd still cheering and clapping.", "gt-answer": "A. Zooming into three football players", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description does not mention anything about the light condition on the football players. Therefore, there is not enough information to determine what is happening to the light condition.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows three men walking onto a field, and they are wearing red shirts. The men are seen walking towards the camera, and they are wearing black shorts. The men are seen walking towards the camera, and they are wearing black shorts. The men are seen walking towards the camera, and they are wearing black shorts. The men are seen walking towards the camera, and they are wearing black shorts. The men are seen walking towards the camera, and they are wearing black shorts. The men are seen walking towards the camera, and they are wearing black shorts.", "gt-answer": "C. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the men are wearing red shirts and white shorts, but there is no mention of any changes in light conditions on the football players.", "chatgpt-answer": "A. staying the same", "video-llm-prediction": "The video shows three men walking onto a field, with the audience cheering them on. The men are wearing red shirts and white shorts, and they are seen walking towards the center of the field. The audience is cheering loudly, and the men seem to be enjoying the attention. The men then start playing football, with the audience cheering them on. The men seem to be having a great time, and the audience is enjoying the game as well. The video captures the excitement and energy of the game, with the audience cheering and the men enjoying the game.", "gt-answer": "C. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the lighting changes from dark to bright. This indicates that the light condition on the football players is turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video shows three men walking onto a field, and the lighting changes from dark to bright.", "gt-answer": "C. turning brighter", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the lighting changes from dark to bright. This implies that the light condition on the football players is turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video shows three men walking onto a field, and the lighting changes from dark to bright.", "gt-answer": "C. turning brighter", "rating": 1 } ] }, "1055973887": { "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly states that the fire ball starts small and gradually grows in size.", "chatgpt-answer": "C. getting larger", "video-llm-prediction": "The video shows a fire ball that starts small and gradually grows in size. The fire ball is the subject of the video, and its size changes throughout the video. The fire ball is shown in different positions, including in the air and on the ground. The video captures the fire ball's movement and its gradual growth, making it an interesting and engaging video to watch.", "gt-answer": "C. getting larger", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball starts small and gradually grows in size.", "chatgpt-answer": "C. getting larger", "video-llm-prediction": "The video shows a fire ball that starts small and gradually grows in size. The fire ball is the main subject of the video, and it is the only information that matches the content of the video.", "gt-answer": "C. getting larger", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is seen getting smaller and larger.", "chatgpt-answer": "C. getting larger", "video-llm-prediction": "A fire ball is shown in the video, and it is seen getting smaller and larger.", "gt-answer": "C. getting larger", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is getting both smaller and larger.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A fire ball is shown in the video, and it is seen getting smaller and larger.", "gt-answer": "C. getting larger", "rating": 0 } ] }, "1098710341": { "action": [ { "chatgpt-reasoning": "The video description clearly states that we see a person pouring water into a glass. None of the other choices are consistent with this description.", "chatgpt-answer": "B. pouring water into a glass", "video-llm-prediction": "In the video, we see a person pouring water into a glass, which is consistent with Information B. However, the other information provided is not consistent with the video.", "gt-answer": "B. pouring water into a glass", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is seen performing multiple actions related to water, such as drinking water from a glass, pouring water into a glass, washing hands with water, and spilling water on the floor. Among the given choices, all of these actions are mentioned except for option D (spilling water on the floor).", "chatgpt-answer": "D. spilling water on the floor", "video-llm-prediction": "A person is seen drinking water from a glass, pouring water into a glass, and washing their hands with water. The video also shows a person spilling water on the floor.", "gt-answer": "B. pouring water into a glass", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen drinking water from a glass, pouring water into a glass, washing hands with water, and spilling water on the floor.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen drinking water from a glass, pouring water into a glass, washing hands with water, and spilling water on the floor.", "gt-answer": "B. pouring water into a glass", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen doing multiple activities involving water. These activities include drinking water from a glass, pouring water into a glass, washing their hands with water, and spilling water on the floor.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "A person is seen drinking water from a glass, pouring water into a glass, and washing their hands with water. The video also shows a person spilling water on the floor.", "gt-answer": "B. pouring water into a glass", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the glass is being filled and then emptied. This suggests that the glass is going from full of water to empty.", "chatgpt-answer": "B. It is going from full of water to empty", "video-llm-prediction": "The video shows a glass of water being filled and then emptied. The glass is shown in different positions, including on a table and in a hand. The video also includes a close-up shot of the glass.", "gt-answer": "C. It is going from empty to full of water", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the glass is being filled and drained multiple times, and it ends with the glass being shown empty. From this information, we can conclude that the glass is going from full of water to empty.", "chatgpt-answer": "B. It is going from full of water to empty", "video-llm-prediction": "The video shows a glass of water being filled and then drained, with the glass being shown in different positions throughout the video. The glass is also shown being filled with ice and water, and then drained again. The video ends with the glass being shown empty.", "gt-answer": "C. It is going from empty to full of water", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the glass is being transformed into a different shape.", "chatgpt-answer": "D. It is transforming into a different shape", "video-llm-prediction": "A glass is shown being filled with water and then drained. The video showcases the glass being transformed into a different shape.", "gt-answer": "C. It is going from empty to full of water", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the glass is seen changing from full to empty and then back to full again. It also mentions that the glass is transforming into a different shape.", "chatgpt-answer": "C. It is going from empty to full of water", "video-llm-prediction": "The video shows a glass of water being filled and then emptied. The glass is seen changing from full to empty and then back to full again. The video also shows the glass transforming into a different shape.", "gt-answer": "C. It is going from empty to full of water", "rating": 1 } ] }, "1062736174": { "action": [ { "chatgpt-reasoning": "The video description mentions that the chef is preparing a steak by chopping it up, sprinkling vegetables on it, sprinkling salt on the steak, and grilling it.", "chatgpt-answer": "D. grilling steak", "video-llm-prediction": "A chef is seen preparing a steak by chopping it up and sprinkling vegetables on it. He then sprinkles salt on the steak and grills it.", "gt-answer": "C. sprinkling salt on steak", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the chef is preparing a steak by chopping it up, sprinkling vegetables on top, adding salt, and grilling the steak.", "chatgpt-answer": "A. chopping steak", "video-llm-prediction": "A chef is seen preparing a steak by chopping it up and sprinkling vegetables on top. He then adds salt and grills the steak.", "gt-answer": "C. sprinkling salt on steak", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef is seen preparing a steak by chopping it, sprinkling vegetables on it, and then grilling it.", "chatgpt-answer": "D. grilling steak", "video-llm-prediction": "A chef is seen preparing a steak by chopping it, sprinkling vegetables on it, and then grilling it.", "gt-answer": "C. sprinkling salt on steak", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef is seen preparing a steak by chopping it, sprinkling vegetables and salt on it, grilling it, and serving it on a plate. Therefore, all of the choices A, B, C, and D are correct.", "chatgpt-answer": "All of the choices are correct.", "video-llm-prediction": "A chef is seen preparing a steak by chopping it and sprinkling vegetables and salt on it. He then grills the steak and serves it on a plate.", "gt-answer": "C. sprinkling salt on steak", "rating": 0 } ] }, "1099116143": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the white foam appears on the surface of the pink liquid, then the liquid freezes, and finally, the liquid evaporates. This suggests a sequence of events where the white foam initially forms, followed by the freezing of the liquid, and ultimately the evaporation of the liquid.", "chatgpt-answer": "B. White foam appears on the surface", "video-llm-prediction": "The video shows a close-up of a pink liquid in a glass, with a white foam appearing on the surface. The liquid is then shown freezing, and the foam disappears. The video then shows the liquid evaporating, leaving only the pink liquid behind.", "gt-answer": "B. White foam appears on the surface", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the first description shows the pink liquid with white foam on its surface, while the second description shows the pink liquid with no foam on its surface. This indicates that the white foam disappears from the surface of the pink liquid.", "chatgpt-answer": "A. White foam disappears from the surface", "video-llm-prediction": "The video showcases a close-up of a pink liquid, which is then followed by a series of text descriptions. The first description shows the pink liquid with white foam on its surface, while the second description shows the pink liquid with no foam on its surface. The third description shows the pink liquid freezing, and the fourth description shows the pink liquid evaporating. The video captures the different stages of the pink liquid, from its initial appearance to its eventual transformation. The close-up shots of the pink liquid provide a detailed view of its texture and color, making", "gt-answer": "B. White foam appears on the surface", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the liquid is initially being stirred, then left to sit still. After that, the foam on the surface disappears and the liquid freezes. Finally, the liquid evaporates. Based on this information, it can be concluded that the pink liquid is going through a process of evaporation.", "chatgpt-answer": "D. It is evaporating", "video-llm-prediction": "The video shows a close-up of a pink liquid in a glass, which is being stirred. The liquid is then left to sit still, and the camera zooms in to show the foam on the surface. The foam then disappears, and the liquid is left to freeze. The video ends with the liquid evaporating.", "gt-answer": "B. White foam appears on the surface", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the pink liquid is observed to be freezing and evaporating. It also mentions that there is white foam appearing on the surface of the liquid.", "chatgpt-answer": "B. White foam appears on the surface", "video-llm-prediction": "The video showcases a close-up of a pink liquid, which is then observed to be freezing and evaporating. The video also features a white foam that appears on the surface of the liquid.", "gt-answer": "B. White foam appears on the surface", "rating": 1 } ] }, "1108398787": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is seen chatting on a smartphone device. It also mentions that the device is used to watch videos and play games. Therefore, the correct answer is A. Chatting on a smartphone device.", "chatgpt-answer": "A. Chatting on a smartphone device", "video-llm-prediction": "A person is seen chatting on a smartphone device. The device is then shown with the settings of the operating system. The device is then used to watch videos and play games.", "gt-answer": "B. Operating system settings on a smartphone device", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is chatting on a smartphone device, watching a video, and playing a game. From the given choices, option A (Chatting on a smartphone device) best describes the actions performed by the person in the video.", "chatgpt-answer": "A. Chatting on a smartphone device", "video-llm-prediction": "A person is seen chatting on a smartphone device, with the device's settings being displayed on the screen. The person then watches a video on the device and plays a game.", "gt-answer": "B. Operating system settings on a smartphone device", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen chatting on a smartphone device, then the device is shown with the option to change the settings, and finally the person watches a video on the device. This sequence of actions suggests that the person is performing the action of operating system settings on a smartphone device.", "chatgpt-answer": "B. Operating system settings on a smartphone device", "video-llm-prediction": "A person is seen chatting on a smartphone device. The device is then shown with the option to change the settings. The person then watches a video on the device.", "gt-answer": "B. Operating system settings on a smartphone device", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is seen chatting, operating system settings, watching videos, and playing games on a smartphone device.", "chatgpt-answer": "All of the choices are correct.", "video-llm-prediction": "A person is seen chatting on a smartphone device, followed by operating system settings on the same device. The person then watches videos on the smartphone device, and finally, they play games on the same device.", "gt-answer": "B. Operating system settings on a smartphone device", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that the person is first scrolling down and then entering passwords. After that, the person is shown scrolling up and entering more passwords.", "chatgpt-answer": "D. Entering passwords and then scrolling up", "video-llm-prediction": "A person is shown scrolling down and then entering passwords. The video then shows the person scrolling up and entering more passwords.", "gt-answer": "A. Scrolling down and then entering passwords", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen scrolling down and then entering passwords. They then scroll up and enter more passwords. This indicates that the correct order of events is scrolling down first and then entering passwords.", "chatgpt-answer": "A. Scrolling down and then entering passwords", "video-llm-prediction": "A person is seen scrolling down and then entering passwords. They then scroll up and enter more passwords. The video seems to be a tutorial on how to enter passwords. The person in the video is demonstrating the correct way to enter passwords. The video is informative and helpful for those who are new to entering passwords. The video is shot in a clear and concise manner, making it easy to follow along. Overall, the video is a useful resource for anyone who needs to learn how to enter passwords.", "gt-answer": "A. Scrolling down and then entering passwords", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the person is first scrolling down and then entering passwords.", "chatgpt-answer": "A. Scrolling down and then entering passwords", "video-llm-prediction": "A person is seen scrolling down and then entering passwords.", "gt-answer": "A. Scrolling down and then entering passwords", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the person is first scrolling down and then entering passwords, followed by scrolling up and entering more passwords.", "chatgpt-answer": "A. Scrolling down and then entering passwords", "video-llm-prediction": "A person is seen scrolling down and then entering passwords. They then scroll up and enter more passwords.", "gt-answer": "A. Scrolling down and then entering passwords", "rating": 1 } ] }, "1080591311": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the jellyfish are seen moving towards the right, floating upwards, and sinking downwards.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "The video showcases a group of jellyfish swimming in the ocean. The jellyfish are seen moving towards the right, floating upwards, and sinking downwards. The video captures the beauty and grace of these aquatic creatures as they move through the water.", "gt-answer": "B. floating upwards", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the jellyfish are swimming towards the right.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "The video showcases a group of jellyfish swimming in the ocean. The camera captures the movement of the jellyfish as they swim towards the right. The jellyfish are seen floating upwards and sinking downwards, creating a mesmerizing visual effect. The video highlights the beauty and grace of these aquatic creatures, making it a must-watch for anyone interested in marine life.", "gt-answer": "B. floating upwards", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the jellyfish are moving towards the right.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "A group of jellyfish are seen swimming in the water. They are moving towards the right.", "gt-answer": "B. floating upwards", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that \"some [jellyfish] are moving towards the right and others floating upwards.\" Therefore, the jellyfish are moving in two directions - some towards the right and some floating upwards.", "chatgpt-answer": "A. moving towards the right and B. floating upwards", "video-llm-prediction": "A group of jellyfish are seen swimming in the ocean, with some moving towards the right and others floating upwards. The jellyfish continue to move around in the water.", "gt-answer": "B. floating upwards", "rating": 0 } ] }, "1107034223": { "action": [ { "chatgpt-reasoning": "The video description mentions that the bear is seen swimming in the water, climbing trees, and sleeping in the water. However, it specifically states that the bear is catching a fish in the water, indicating that it is actively engaged in catching fishes.", "chatgpt-answer": "D. catching fishes", "video-llm-prediction": "The video shows a brown bear catching a fish in the water. The bear is seen swimming in the water and climbing trees. The bear is also seen sleeping in the water. The video captures the bear's natural behavior in its habitat.", "gt-answer": "D. catching fishes", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the bear is seen swimming in the water, climbing trees, and catching fishes. This implies that the bear is actively engaged in catching fishes.", "chatgpt-answer": "D. catching fishes", "video-llm-prediction": "A brown bear is seen swimming in the water, climbing trees, and catching fishes. The video showcases the bear's natural behavior in its habitat.", "gt-answer": "D. catching fishes", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the bear is swimming in the water, climbing trees, and catching fishes.", "chatgpt-answer": "D. catching fishes", "video-llm-prediction": "A brown bear is seen swimming in the water, climbing trees, and catching fishes.", "gt-answer": "D. catching fishes", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the bear is seen swimming in the water, climbing trees, and catching fishes.", "chatgpt-answer": "D. catching fishes", "video-llm-prediction": "A brown bear is seen swimming in the water, climbing trees, and catching fishes.", "gt-answer": "D. catching fishes", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "Based on the video description, the bear is first seen running forward and then catching a fish. After catching the fish, the bear swallows it. Finally, the bear turns back.", "chatgpt-answer": "B. Running forward and then catching a fish", "video-llm-prediction": "A brown bear is seen in the video catching a fish in the water. The bear is seen running forward and then catching the fish. The bear then swallows the fish and turns back. The video shows the bear in a natural environment, with the sound of water and the occasional growl of the bear. The bear is seen in different positions, sometimes standing on the shore and other times in the water. The video captures the beauty and power of the bear in its natural habitat.", "gt-answer": "D. Catching a fish and then turning back", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the bear is seen running forward and then catching the fish. Therefore, the correct answer is B. Running forward and then catching a fish.", "chatgpt-answer": "B. Running forward and then catching a fish", "video-llm-prediction": "A brown bear is seen in the video catching a fish in the water. The bear is seen running forward and then catching the fish. It then swallows the fish and turns back. The video showcases the bear's hunting skills and its ability to catch fish in the water. The bear's movements are fluid and graceful, and it appears to be completely in control of the situation. The video provides a glimpse into the natural behavior of bears and their hunting habits. Overall, the video is a fascinating display of the bear's hunting abilities and its ability to catch fish", "gt-answer": "D. Catching a fish and then turning back", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the bear catches a fish in the water, turns back and catches the fish again, swallows the fish, and turns back again. This implies that the correct order of events involving the bear is catching a fish and then turning back.", "chatgpt-answer": "D. Catching a fish and then turning back", "video-llm-prediction": "A brown bear is seen catching a fish in the water. It turns back and catches the fish again. The bear then swallows the fish and turns back again.", "gt-answer": "D. Catching a fish and then turning back", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the bear first catches a fish in the river, then turns back, swallows the fish, and finally turns back again.", "chatgpt-answer": "D. Catching a fish and then turning back", "video-llm-prediction": "A brown bear is seen catching a fish in a river. It turns back and then catches the fish. The bear then swallows the fish and turns back.", "gt-answer": "D. Catching a fish and then turning back", "rating": 1 } ] }, "1025623079": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the skyscraper is being destroyed by an explosion, and it shows the building collapsing in slow motion.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "The video shows a skyscraper that is being destroyed by an explosion. The building is shown in several clips, and the explosion is shown in slow motion. The building is seen collapsing in the video.", "gt-answer": "D. collapsing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the skyscraper is initially dark and then begins to light up. It also states that as the lighting increases, the skyscraper becomes taller and taller. However, the video ends with the skyscraper collapsing.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "The video shows a skyscraper that is initially dark and then begins to light up. As the lighting increases, the skyscraper becomes taller and taller. However, the video ends with the skyscraper collapsing.", "gt-answer": "D. collapsing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the skyscraper is seen growing taller and then collapsing.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "A skyscraper is shown in the video, and it is seen growing taller and then collapsing.", "gt-answer": "D. collapsing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the skyscraper is seen growing taller and then collapsing. It implies that the skyscraper is experiencing a process of getting bigger and then falling down.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "A skyscraper is shown in the video, and it is seen growing taller and then collapsing.", "gt-answer": "D. collapsing", "rating": 1 } ] }, "1094782389": { "action": [ { "chatgpt-reasoning": "The video description states that the dog runs towards the woman and jumps on her. This indicates that the correct answer is the action of \"Jumping towards a woman.\"", "chatgpt-answer": "B. Jumping towards a woman", "video-llm-prediction": "A woman is seen petting a dog in a park. The dog then runs towards the woman and jumps on her. The woman then pets the dog and the dog licks her hand. The video showcases the bond between a woman and her furry friend.", "gt-answer": "D. Giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dog is running towards a woman, jumping towards her, and barking at her. There is no mention of the dog giving a high five to the woman.", "chatgpt-answer": "A. Running towards a woman", "video-llm-prediction": "A dog is seen running towards a woman, jumping towards her, and barking at her. The woman then gives the dog a high five.", "gt-answer": "D. Giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the dog is running towards a woman, jumping towards her, and barking. There is no mention of the dog giving a high five to the woman.", "chatgpt-answer": "A. Running towards a woman", "video-llm-prediction": "A dog is seen running towards a woman, jumping towards her, and barking. The woman then gives the dog a high five.", "gt-answer": "D. Giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dog is running towards a woman, jumping towards her, and barking to her. There is no mention of the dog giving a high five to the woman.", "chatgpt-answer": "B. Jumping towards a woman", "video-llm-prediction": "A dog is seen running towards a woman, jumping towards her, and barking to her. The woman then gives the dog a high five.", "gt-answer": "D. Giving a high five to a woman", "rating": 0 } ] }, "3411228673": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans up and down, capturing the city's skyline and the bustling activity below. This suggests that the movement in the video is either upwards or downwards.", "chatgpt-answer": "B. upwards among skyscraper buildings", "video-llm-prediction": "The video showcases a city with tall buildings and a busy street. The camera pans up and down, capturing the city's skyline and the bustling activity below. The video also includes a shot of a large building with a sign that reads \"the world's tallest building.\" Overall, the video provides a stunning view of the city and its architecture.", "gt-answer": "B. upwards among skyscraper buildings", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans upwards and downwards, providing a comprehensive view of the city. This means that the movement is happening vertically, either going upwards or downwards.", "chatgpt-answer": "B. upwards among skyscraper buildings", "video-llm-prediction": "The video showcases a cityscape with skyscrapers and a busy street filled with traffic. The camera pans upwards and downwards, providing a comprehensive view of the city. The video captures the hustle and bustle of the city, with cars and people moving about. The camera also captures the surrounding buildings, showcasing the city's architecture. The video provides a glimpse into the city's daily life, highlighting the city's vibrant energy.", "gt-answer": "B. upwards among skyscraper buildings", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans down to show the city from a lower angle and then pans upwards to show the city from a higher angle. This indicates that the movement in the video is vertical, either upwards or downwards.", "chatgpt-answer": "C. downwards towards the ground", "video-llm-prediction": "A video showcasing the cityscape of a city with skyscrapers and a mountain in the background. The video starts with a view of the city from the top of a skyscraper, then pans down to show the city from a lower angle. The camera then pans upwards to show the city from a higher angle. The video ends with a view of the city from the top of a skyscraper.", "gt-answer": "B. upwards among skyscraper buildings", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans upwards, downwards, and sideways to capture the entire scene. This indicates that the camera is moving in multiple directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a cityscape with skyscrapers and a road running through it. The camera pans upwards, downwards, and sideways to capture the entire scene.", "gt-answer": "B. upwards among skyscraper buildings", "rating": 0 } ] }, "1043487715": { "action": [ { "chatgpt-reasoning": "The video description mentions that the children are swimming in a pool and playing with a ball and a frisbee. It does not mention anything about diving into water, eating or sleeping.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of children swimming in a pool. One of the children is seen swimming underwater while the others are swimming on the surface. The children are also seen playing with a ball and a frisbee. The video captures the children's playful and carefree nature as they enjoy their time in the pool.", "gt-answer": "A. diving into water", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the children are swimming in a pool, not diving into water, eating or sleeping.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of children are seen swimming in a pool, with one of them holding onto another. The video captures the children's playful and carefree nature as they enjoy the water.", "gt-answer": "A. diving into water", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the children are seen diving into the water and swimming around.", "chatgpt-answer": "A. diving into water", "video-llm-prediction": "A group of children are seen swimming in a pool. They are seen diving into the water and swimming around.", "gt-answer": "A. diving into water", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the children are swimming in a pool and having a great time. This implies that they are engaging in some water activity, not eating or sleeping.", "chatgpt-answer": "A. diving into water", "video-llm-prediction": "A group of children are seen swimming in a pool, with one of them holding onto another. They are all smiling and having a great time.", "gt-answer": "A. diving into water", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description mentions that one of the children is seen diving into the water and then making gestures to the camera. So, the correct order of events is \"diving into water and then making gestures to the camera\".", "chatgpt-answer": "A. diving into water and then making gestures to the camera", "video-llm-prediction": "The video shows a group of children having fun in a pool. They are seen swimming and making gestures to the camera. One of the children is seen diving into the water and making gestures to the camera. The video captures the children's playful and carefree nature as they enjoy their time in the pool.", "gt-answer": "A. diving into water and then making gestures to the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the children are seen making gestures to the camera before diving into the water. Therefore, the correct order of events is making gestures to the camera and then diving into the water.", "chatgpt-answer": "B. making gestures to the camera and then diving into water", "video-llm-prediction": "In the video, a group of children are seen swimming in a pool. They are seen making gestures to the camera before diving into the water. The children seem to be enjoying themselves as they swim around the pool. The video captures the children's playful and carefree nature as they enjoy their time in the water. The children's movements are fluid and graceful, indicating that they are comfortable in the water. Overall, the video showcases the children's love for swimming and their ability to have fun while doing it.", "gt-answer": "A. diving into water and then making gestures to the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the children are first seen swimming in a pool and making gestures to the camera, and then they dive into the water and swim around. Therefore, the correct answer is B. making gestures to the camera and then diving into water.", "chatgpt-answer": "B. making gestures to the camera and then diving into water", "video-llm-prediction": "A group of children are seen swimming in a pool and making gestures to the camera. They then dive into the water and swim around.", "gt-answer": "A. diving into water and then making gestures to the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the children can be seen making gestures to the camera before diving into the water. Therefore, the correct order of events is \"making gestures to the camera and then diving into water\".", "chatgpt-answer": "B. making gestures to the camera and then diving into water", "video-llm-prediction": "The video captures a group of children having fun in a pool. They can be seen making gestures to the camera before diving into the water. The children seem to be enjoying themselves as they play and splash around in the pool. The video provides a glimpse into the carefree and playful nature of children as they enjoy the warm summer weather.", "gt-answer": "A. diving into water and then making gestures to the camera", "rating": 0 } ] }, "1093737353": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans to the right, rotates, tilts up, and zooms in.", "chatgpt-answer": "A. panning to the right", "video-llm-prediction": "The video showcases a series of beakers filled with different colored liquids, with a focus on the green liquid. The camera pans to the right, rotates, tilts up, and zooms in to provide a closer look at the green liquid. The video highlights the unique properties of the green liquid and its potential uses in various applications.", "gt-answer": "A. panning to the right", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera zooms in on the beakers, indicating that it is performing a zooming in motion.", "chatgpt-answer": "D. zooming in", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with one of them being rotated. The camera then zooms in on the beakers, providing a closer look at the green liquid. The video seems to be focused on the green liquid and its properties.", "gt-answer": "A. panning to the right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans to the right, rotates, tilts up, and zooms in.", "chatgpt-answer": "A. panning to the right", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with one beaker containing a plant. The camera pans to the right, rotates, tilts up, and zooms in to provide a closer look at the beakers. The video highlights the green liquid and the plant in the beaker, emphasizing the color green and the presence of the plant.", "gt-answer": "A. panning to the right", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans to the right, capturing the entire scene.", "chatgpt-answer": "A. panning to the right", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with one beaker containing a plant. The beakers are placed on a table, and the camera pans to the right, capturing the entire scene. The video highlights the unique properties of the green liquid and the plant, emphasizing their importance in scientific research.", "gt-answer": "A. panning to the right", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video describes the scientist mixing liquids in a beaker and then placing it on a table. After that, the experiment is observed under a microscope. This indicates that the sequence of equipment shown in the video is a beaker first, followed by a microscope.", "chatgpt-answer": "C. A beaker and then a microscope", "video-llm-prediction": "The video showcases a scientist conducting a chemical experiment in a laboratory. The scientist is seen mixing various liquids in a beaker, which is then placed on a table. The experiment is then observed under a microscope, revealing the results of the experiment. The video highlights the importance of scientific experimentation and the use of a microscope in analyzing the results.", "gt-answer": "D. A line of test tubes and then a beaker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the beakers are observed under a microscope, indicating that the microscope is shown after the beakers.", "chatgpt-answer": "C. A beaker and then a microscope", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with a microscope placed on a table next to them. The beakers are then observed under a microscope, revealing their contents. The video highlights the importance of using a microscope to observe and analyze the contents of the beakers.", "gt-answer": "D. A line of test tubes and then a beaker", "rating": 0 }, { "chatgpt-reasoning": "The video description states that a beaker is shown with a green liquid inside and a microscope is shown on the table. Based on this information, we can conclude that the beaker is shown first and then the microscope.", "chatgpt-answer": "C. A beaker and then a microscope", "video-llm-prediction": "A beaker is shown with a green liquid inside, and a microscope is shown on the table.", "gt-answer": "D. A line of test tubes and then a beaker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a scientist is first seen mixing liquids in a beaker, followed by using a microscope to observe the mixture. Therefore, the correct order of the equipment shown in the video is a beaker and then a microscope.", "chatgpt-answer": "C. A beaker and then a microscope", "video-llm-prediction": "A scientist is seen mixing liquids in a beaker, followed by a microscope being used to observe the mixture. The beaker is then filled with a green liquid and the microscope is used to observe the contents.", "gt-answer": "D. A line of test tubes and then a beaker", "rating": 0 } ] }, "1063373449": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the cells are multiplying rapidly and spreading throughout the body. The video also shows the cells being attacked by antibodies and dissolving. From this, we can infer that the coronavirus is being attacked by antibodies and dissolving.", "chatgpt-answer": "D. dissolving under the attack of antibodies", "video-llm-prediction": "The video shows a close-up of a cell, which then transitions to a large number of cells multiplying rapidly. The video then shows the cells multiplying and spreading rapidly throughout the body. The video ends with the cells being attacked by antibodies and dissolving.", "gt-answer": "D. dissolving under the attack of antibodies", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the coronavirus is mutating into a new strain.", "chatgpt-answer": "B. mutating into a new strain", "video-llm-prediction": "The video showcases the rapid spread of the coronavirus, with a focus on its mutation into a new strain. The video also highlights the effectiveness of antibodies in neutralizing the virus.", "gt-answer": "D. dissolving under the attack of antibodies", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the cell multiplies rapidly, mutates into a new strain, and spreads rapidly throughout the body. It also mentions that the cell dissolves under the attack of antibodies. These actions are associated with the behavior of a virus. Given that the question asks about the coronavirus specifically, which is a type of virus, it can be inferred that all of the choices (A, B, C, D) are correct.", "chatgpt-answer": "A. multiplying in the body", "video-llm-prediction": "The video shows a close-up of a cell, which then multiplies rapidly. The cell then mutates into a new strain and spreads rapidly throughout the body. The video ends with the cell dissolving under the attack of antibodies.", "gt-answer": "D. dissolving under the attack of antibodies", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the coronavirus is multiplying and mutating into a new strain, as well as spreading rapidly. It also highlights the effectiveness of antibodies in dissolving the virus.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "The video shows the rapid spread of the coronavirus in the body, as it multiplies and mutates into a new strain. The video also highlights the effectiveness of antibodies in dissolving the virus.", "gt-answer": "D. dissolving under the attack of antibodies", "rating": 0 } ] }, "1017768724": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the person is holding a compass in their hand and pointing it towards the camera. They then move the compass around to show the different directions. Based on this information, we can infer that the person's movement is determined by the movement of the compass.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen holding a compass in their hand and pointing it towards the camera. The person then moves the compass around to show the different directions.", "gt-answer": "D. moving rightwards", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the person is seen holding a compass in their hand and pointing it towards the camera. When the person turns the compass around, they continue to point it towards the camera. This suggests that the person is moving the compass in a circular motion around themselves while keeping it pointed towards the camera. Since there is no indication of upward or downward movement, and the person is not explicitly shown moving leftwards or rightwards, the most suitable answer would be \"None of the choices are correct\" since none of the given options accurately represent the person's movement.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen holding a compass in their hand and pointing it towards the camera. The person then turns the compass around and continues to point it towards the camera. The person then turns the compass around again and continues to point it towards the camera.", "gt-answer": "D. moving rightwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is holding a compass and pointing it towards the camera. The person then moves the compass around to show different directions. Based on this information, we can infer that the person is moving the compass horizontally in order to show the different directions. Therefore, the person's movement can be interpreted as moving rightwards.", "chatgpt-answer": "D. moving rightwards", "video-llm-prediction": "A person is seen holding a compass and pointing it towards the camera. The person then moves the compass around to show the different directions.", "gt-answer": "D. moving rightwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is holding a compass and pointing it towards the camera. The person then moves the compass around to show the different directions. From this information, we can infer that the person's movement is related to the movement of the compass. When someone is using a compass, they typically rotate it in a circular motion, which means they are moving the compass rightwards or clockwise.", "chatgpt-answer": "D. moving rightwards", "video-llm-prediction": "A person is seen holding a compass and pointing it towards the camera. The person then moves the compass around to show the different directions.", "gt-answer": "D. moving rightwards", "rating": 1 } ] }, "1106280325": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman is hiking, playing guitar, reading a book, and dancing.", "chatgpt-answer": "A. hiking", "video-llm-prediction": "A woman is seen hiking in the woods, playing guitar, reading a book, and dancing on a hillside.", "gt-answer": "C. reading book", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is seen sitting on a hillside and reading a book. None of the other choices such as hiking, playing guitar, or dancing are mentioned in the description.", "chatgpt-answer": "C. reading book", "video-llm-prediction": "A woman is seen sitting on a hillside, reading a book. She is wearing a black dress and has her legs crossed. The surrounding area is covered in grass and trees. The woman is enjoying the peaceful surroundings and seems to be lost in her book. The sun is shining brightly in the sky, casting a warm glow on the scene. The woman's hair is tied up in a ponytail, and she has a smile on her face. The camera captures the serene atmosphere of the scene, and the woman's relaxed posture. The video ends with the woman", "gt-answer": "C. reading book", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is hiking, playing guitar, reading a book, and dancing.", "chatgpt-answer": "A. hiking, B. playing guitar, C. reading book, D. dancing", "video-llm-prediction": "A woman is seen hiking in the woods, playing guitar, reading a book, and dancing on a hillside.", "gt-answer": "C. reading book", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is seen hiking in the woods, playing guitar, reading a book, and dancing on the grass. Among the given choices, all of them are mentioned in the video description. However, since the question asks for what the woman is doing, we can eliminate options A and D since they describe activities other than the main action. Therefore, the correct answer is B. playing guitar.", "chatgpt-answer": "B. playing guitar", "video-llm-prediction": "A woman is seen hiking in the woods, playing guitar, reading a book, and dancing on the grass.", "gt-answer": "C. reading book", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that both events, a girl reading a book and a body of water being shown, are happening simultaneously.", "chatgpt-answer": "A. A girl is shown reading a book and a body of water is shown simultaneously", "video-llm-prediction": "A girl is shown reading a book and a body of water is shown simultaneously.", "gt-answer": "B. A girl is shown reading a book, then a body of water is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description states that both events, the girl reading a book and the body of water shown, are happening simultaneously. This means that both events are occurring at the same time.", "chatgpt-answer": "A. A girl is shown reading a book and a body of water is shown simultaneously", "video-llm-prediction": "A girl is shown reading a book and a body of water is shown simultaneously.", "gt-answer": "B. A girl is shown reading a book, then a body of water is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that \"A girl is shown reading a book and a body of water is shown simultaneously\". This implies that both events are happening at the same time.", "chatgpt-answer": "A. A girl is shown reading a book and a body of water is shown simultaneously", "video-llm-prediction": "A girl is shown reading a book and a body of water is shown simultaneously.", "gt-answer": "B. A girl is shown reading a book, then a body of water is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girl is shown reading a book while a body of water is shown in the background. This indicates that both events are happening simultaneously, so the correct answer is A. A girl is shown reading a book and a body of water is shown simultaneously.", "chatgpt-answer": "A. A girl is shown reading a book and a body of water is shown simultaneously", "video-llm-prediction": "A girl is shown reading a book while a body of water is shown in the background. The video captures the serene and peaceful atmosphere of the location.", "gt-answer": "B. A girl is shown reading a book, then a body of water is shown", "rating": 0 } ] }, "1100117263": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the baby lion is climbing on top of an adult lion while they both lay in the grass. This indicates a vertical motion, either upward or downward. However, since the video captures the playful and carefree nature of the baby lion as it explores its surroundings, it is more likely that the baby lion is climbing upward.", "chatgpt-answer": "B. upward", "video-llm-prediction": "The video shows a baby lion climbing on top of an adult lion while they both lay in the grass. The baby lion is seen walking around and playing with the adult lion. The video captures the playful and carefree nature of the baby lion as it explores its surroundings. The adult lion seems to be content and relaxed as it allows the baby lion to climb on top of it. The video provides a glimpse into the lives of these majestic creatures and their interactions with each other.", "gt-answer": "A. downward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the baby lion is seen climbing on top of an adult lion and playing with the adult lion in the grass. Since the video description does not specify any other direction, we can assume that the baby lion's motion is upward as it climbs on top of the adult lion.", "chatgpt-answer": "B. upward", "video-llm-prediction": "A baby lion is seen climbing on top of an adult lion in the wild. The baby lion is seen biting the adult lion's neck, and the adult lion is seen licking the baby lion. The baby lion is also seen playing with the adult lion in the grass.", "gt-answer": "A. downward", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the baby lion climbs on top of its mother and then climbs down. Both actions involve vertical motion.", "chatgpt-answer": "A. downward", "video-llm-prediction": "The video shows a baby lion climbing on top of its mother while she is eating grass. The baby lion then climbs down and starts eating grass as well.", "gt-answer": "A. downward", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the baby lion is climbing on top of the adult lion and then climbs down and walks away. This indicates a vertical motion, specifically from the bottom to the top and then from the top to the bottom again.", "chatgpt-answer": "B. upward", "video-llm-prediction": "A baby lion is seen climbing on top of an adult lion while they both lay in the grass. The baby lion then climbs down and walks away.", "gt-answer": "A. downward", "rating": 0 } ] }, "15695290": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is playing soccer, reading a book, and drawing a picture. This means that the person is doing multiple activities at the same time.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen playing soccer, reading a book, and drawing a picture.", "gt-answer": "C. drawing a picture", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen playing soccer, reading a book, and drawing a picture. Therefore, the person is doing all three activities mentioned in the choices.", "chatgpt-answer": "A. playing soccer, B. reading a book, C. drawing a picture", "video-llm-prediction": "A person is seen playing soccer, reading a book, and drawing a picture.", "gt-answer": "C. drawing a picture", "rating": 0 }, { "chatgpt-reasoning": "The video description states that there are three activities happening simultaneously - playing soccer, reading a book, and drawing a picture. Therefore, the person is doing multiple things at the same time.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A person is playing soccer, a person is reading a book, and a person is drawing a picture.", "gt-answer": "C. drawing a picture", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is doing multiple activities - playing soccer, reading a book, and drawing a picture. Therefore, the correct answer would be all of the above.", "chatgpt-answer": "A. playing soccer, B. reading a book, C. drawing a picture", "video-llm-prediction": "A person is seen playing soccer, reading a book, and drawing a picture.", "gt-answer": "C. drawing a picture", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that the person starts by drawing the house and then proceeds to draw the family of people. This indicates that the order of events in the video is that the house is drawn first, followed by the family of people.", "chatgpt-answer": "A. A house is drawn, then a family of people is drawn", "video-llm-prediction": "A person is seen drawing a house and a family of people on a piece of paper. The person starts by drawing the house and then proceeds to draw the family of people. The video seems to be focused on the process of drawing the house and the family of people. The video does not provide any additional information about the context or purpose of the drawing.", "gt-answer": "A. A house is drawn, then a family of people is drawn", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the person starts by drawing the house followed by the family members. This indicates that the order of events is that the house is drawn first, and then the family of people.", "chatgpt-answer": "A. A house is drawn, then a family of people is drawn", "video-llm-prediction": "The video showcases a person drawing a house and a family of people. The person starts by drawing the house, followed by the family members. The video emphasizes the importance of family and home, and how they are interconnected. The person's hand movements are deliberate and precise, indicating a level of skill and experience in drawing. The video's overall tone is calm and peaceful, with a focus on the beauty of the drawing and the importance of family.", "gt-answer": "A. A house is drawn, then a family of people is drawn", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the person starts by drawing the house and then proceeds to draw the family of people. It also mentions that the video showcases the process of drawing the house and the family of people simultaneously, meaning both actions happen at the same time.", "chatgpt-answer": "C. The house and the family are drawn simultaneously", "video-llm-prediction": "A person is seen drawing a house and a family of people on a piece of paper. The person starts by drawing the house and then proceeds to draw the family of people. The video showcases the process of drawing the house and the family of people simultaneously.", "gt-answer": "A. A house is drawn, then a family of people is drawn", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person starts by drawing the house, followed by the family of people. This indicates a sequential order of events.", "chatgpt-answer": "A. A house is drawn, then a family of people is drawn", "video-llm-prediction": "A person is seen drawing a house and a family of people on a piece of paper. The person starts by drawing the house, followed by the family of people. The video showcases the process of drawing the house and the family, with the person carefully sketching each detail. The final result is a beautifully drawn house with a family of people surrounding it. The video is a great example of how to draw a house and a family, and it is sure to inspire anyone who loves to draw.", "gt-answer": "A. A house is drawn, then a family of people is drawn", "rating": 1 } ] }, "1091090295": { "order": [ { "chatgpt-reasoning": "The video description explicitly states that \"One of the hippos pokes its head out of the water, and a bird flies onto its back.\" This indicates that the hippo poking its head out of water happens before the bird flying onto its back.", "chatgpt-answer": "C. A hippo pokes its head out of water, then a bird flying onto the back of a hippo", "video-llm-prediction": "The video shows a group of hippos in a river. One of the hippos pokes its head out of the water, and a bird flies onto its back. The bird then flies off the hippo and lands on the water. The video captures the peaceful and serene environment of the river, with the hippos and birds coexisting in harmony. The sound of the water and the occasional splashing of the hippos add to the tranquil atmosphere. Overall, the video provides a beautiful and calming view of the natural world.", "gt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "rating": 0 }, { "chatgpt-reasoning": "The video description describes that the hippos are seen floating in the water, while the birds perch on their backs, showcasing a peaceful interaction. This implies that the birds first fly onto the back of the hippos before the hippos poke their heads out of the water.", "chatgpt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "video-llm-prediction": "The video showcases a serene scene of hippos and birds coexisting in a natural habitat. The hippos are seen floating in the water, while the birds perch on their backs. The video captures the peaceful interaction between the two species, highlighting the beauty of nature.", "gt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, it is mentioned that \"A bird flies onto the back of a hippo\" and \"the hippo pokes its head out of the water\". This indicates that the bird flying onto the back of the hippo happens first, followed by the hippo poking its head out of the water.", "chatgpt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "video-llm-prediction": "A bird flies onto the back of a hippo, and the hippo pokes its head out of the water.", "gt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the bird flies onto the back of a hippo first, and then the hippo pokes its head out of the water.", "chatgpt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "video-llm-prediction": "A bird flies onto the back of a hippo, and the hippo pokes its head out of the water.", "gt-answer": "A. A bird flying onto the back of a hippo, then a hippo pokes its head out of water", "rating": 1 } ] }, "1021488277": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that \"A person picks up the pineapple and drops it down.\" This means that the person is picking up the pineapple and then releasing/dropping it.", "chatgpt-answer": "D. A person picks up the pineapple", "video-llm-prediction": "A person picks up the pineapple and drops it down.", "gt-answer": "D. A person picks up the pineapple", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states the sequence of events: a person drops down the pineapple, then a person pushes forward the pineapple, next a person rotates the pineapple, and finally a person picks up the pineapple. This means that all of the choices mentioned in the question are correct.", "chatgpt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "A person drops down the pineapple, and then a person pushes forward the pineapple. Next, a person rotates the pineapple, and finally, a person picks up the pineapple.", "gt-answer": "D. A person picks up the pineapple", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"A person drops down the pineapple\".", "chatgpt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "A person drops down the pineapple.", "gt-answer": "D. A person picks up the pineapple", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states the sequence of actions: dropping down, pushing forward, rotating, and picking up the pineapple. Each action corresponds to one of the choices.", "chatgpt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "A person drops down the pineapple, and then a person pushes forward the pineapple. Next, a person rotates the pineapple, and finally, a person picks up the pineapple.", "gt-answer": "D. A person picks up the pineapple", "rating": 0 } ] }, "1106899445": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is brushing their teeth with a toothbrush.", "chatgpt-answer": "A. brushing teeth", "video-llm-prediction": "A person is shown brushing their teeth with a yellow toothbrush. The person then squeezes out toothpaste on the toothbrush and brushes their teeth again.", "gt-answer": "C. squeezing out toothpaste on the toothbrush", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is brushing their teeth with a toothbrush and toothpaste.", "chatgpt-answer": "A. brushing teeth", "video-llm-prediction": "A person is shown brushing their teeth with a yellow toothbrush and toothpaste. They squeeze out toothpaste on the brush and brush their teeth.", "gt-answer": "C. squeezing out toothpaste on the toothbrush", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is brushing their teeth with a yellow toothbrush.", "chatgpt-answer": "A. brushing teeth", "video-llm-prediction": "A person is shown brushing their teeth with a yellow toothbrush. They squeeze out toothpaste on the brush and brush their teeth.", "gt-answer": "C. squeezing out toothpaste on the toothbrush", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is brushing their teeth with a toothbrush and toothpaste. None of the other choices are mentioned in the video description.", "chatgpt-answer": "A. brushing teeth", "video-llm-prediction": "A person is shown brushing their teeth with a yellow toothbrush and toothpaste. They squeeze out toothpaste on the brush and use it to clean their teeth. The video emphasizes the importance of maintaining good oral hygiene.", "gt-answer": "C. squeezing out toothpaste on the toothbrush", "rating": 0 } ] }, "1067925569": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the train is seen moving along the tracks, while the ship is shown sailing in the ocean. It also mentions that the importance of both modes of transportation is emphasized, indicating that they are showcased in separate events.", "chatgpt-answer": "B. First, a cargo train is shown, then a container ship is shown", "video-llm-prediction": "The video showcases a train and a ship carrying cargo. The train is seen moving along the tracks, while the ship is shown sailing in the ocean. The video highlights the efficiency and effectiveness of cargo transportation through both land and sea routes. The train and ship are both essential components of the global supply chain, ensuring that goods are transported from one place to another. The video emphasizes the importance of these modes of transportation in today's fast-paced world. The train and ship are both crucial in ensuring that goods are delivered on time and in good condition. The video is a", "gt-answer": "A. First, a container ship is shown, then a cargo train is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the train is seen moving along the tracks first, and then the ship is shown sailing on the water. This indicates that the cargo train is shown first, followed by the container ship.", "chatgpt-answer": "B. First, a cargo train is shown, then a container ship is shown", "video-llm-prediction": "The video showcases a train and a ship, both carrying cargo. The train is seen moving along the tracks, while the ship is shown sailing on the water. The video highlights the efficiency of the transportation system and the importance of cargo transportation in the economy.", "gt-answer": "A. First, a container ship is shown, then a cargo train is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that a train and a ship are shown simultaneously. This means that both the cargo train and the container ship are shown at the same time.", "chatgpt-answer": "C. The cargo train and the container ship are shown simultaneously", "video-llm-prediction": "A train and a ship are shown simultaneously in the video.", "gt-answer": "A. First, a container ship is shown, then a cargo train is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"A train carrying containers is seen traveling along the tracks, passing by a body of water.\" This implies that the cargo train is shown first. There is no mention of a container ship being shown in the video, so option A can be ruled out. Additionally, there is no mention of the cargo train and container ship being shown simultaneously, so option C can also be ruled out. Therefore, the correct answer is B.", "chatgpt-answer": "B. First, a cargo train is shown, then a container ship is shown", "video-llm-prediction": "A train carrying containers is seen traveling along the tracks, passing by a body of water. The video showcases the movement of the train and the surrounding environment.", "gt-answer": "A. First, a container ship is shown, then a cargo train is shown", "rating": 0 } ] }, "1062609286": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the battery charge starts at 100% and gradually decreases to 0%.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "The video shows a battery charge indicator with a blue background and white text. The indicator starts at 100% and then gradually decreases to 0%. The video also shows a blue battery with a white lightning bolt on it.", "gt-answer": "C. increasing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the battery charge starts at 100% and gradually decreases. Therefore, the correct answer is A. decreasing.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "The video shows a car's battery charge, which starts at 100% and gradually decreases.", "gt-answer": "C. increasing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the battery charge is shown decreasing, staying constant, and increasing.", "chatgpt-answer": "B. staying constant", "video-llm-prediction": "A battery charge is shown decreasing, staying constant, and increasing.", "gt-answer": "C. increasing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the battery charge indicator starts at 100% and gradually decreases to 0%. This indicates that the battery charge is decreasing.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "The video displays a battery charge indicator with a blue background and white text. The indicator starts at 100% and gradually decreases to 0%.", "gt-answer": "C. increasing", "rating": 0 } ] }, "1100397435": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is seen turning off a robot vacuum cleaner, starting the robot vacuum cleaner, and fixing it.", "chatgpt-answer": "C. fixing the robot vacuum cleaner", "video-llm-prediction": "A person is seen turning off a robot vacuum cleaner in a room. The person then starts the robot vacuum cleaner and proceeds to fix it.", "gt-answer": "B. starts the robot vacuum cleaner", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is turning off the robot vacuum cleaner, starting it again, and then fixing it.", "chatgpt-answer": "A. turning off the robot vacuum cleaner", "video-llm-prediction": "A person is seen turning off a robot vacuum cleaner, and then starts it again. The person then proceeds to fix the robot vacuum cleaner.", "gt-answer": "B. starts the robot vacuum cleaner", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person turns off the robot vacuum cleaner, starts it again, and fixes it.", "chatgpt-answer": "C. fixing the robot vacuum cleaner", "video-llm-prediction": "A person turns off the robot vacuum cleaner, starts it again, and fixes it.", "gt-answer": "B. starts the robot vacuum cleaner", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is holding a vacuum cleaner and turning it on. This indicates that she is starting the vacuum cleaner.", "chatgpt-answer": "B. starts the robot vacuum cleaner", "video-llm-prediction": "A woman is seen in a kitchen, holding a vacuum cleaner and turning it on. She then proceeds to vacuum the floor.", "gt-answer": "B. starts the robot vacuum cleaner", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "The video description states that the woman is using the robot vacuum cleaner to clean the floor. Since the woman is standing in the kitchen, it can be inferred that she is cleaning the floor within the kitchen. Therefore, the vacuum cleaner would be moving across the floor, either towards the right side of the screen or towards the left side of the screen.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen standing in a kitchen and holding a robot vacuum cleaner. She then proceeds to clean the floor with the vacuum cleaner. The video showcases the woman using the robot vacuum cleaner to clean the floor.", "gt-answer": "A. to the right side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description does not explicitly mention the direction in which the robot vacuum cleaner is moving. It only mentions that the woman is using the vacuum to clean various parts of her home. Therefore, there is not enough information to determine the correct answer.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen using a robot vacuum cleaner to clean her home. She starts by placing the vacuum on the floor and then proceeds to use it to clean the kitchen floor. The woman then moves the vacuum to the living room floor and uses it to clean the floor. Throughout the video, the woman is seen using the vacuum to clean various parts of her home.", "gt-answer": "A. to the right side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is pushing the vacuum cleaner around the floor and using it to clean different areas of the home. Since the video does not specify any particular direction, we can assume that the vacuum cleaner is moving in various directions depending on the area being cleaned.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen using a robot vacuum cleaner to clean her home. She is seen pushing the vacuum cleaner around the floor and using it to clean the kitchen floor. The video shows the woman using the vacuum cleaner to clean the floor in different areas of the home.", "gt-answer": "A. to the right side of the screen", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the woman is using the robot vacuum cleaner to clean various parts of her home. However, there is no specific mention or indication of the direction in which the robot vacuum cleaner is moving.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A woman is seen using a robot vacuum cleaner to clean her home. She starts by placing the vacuum on the floor and then proceeds to use it to clean the kitchen floor. The woman then moves the vacuum to the living room floor and uses it to clean the floor. Throughout the video, the woman is seen using the vacuum to clean various parts of her home.", "gt-answer": "A. to the right side of the screen", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description clearly states that \"A person enters the screen and then the robot vacuum cleaner starts moving\". This implies that the person's entrance occurs before the robot vacuum cleaner starts moving. Therefore, option A is the correct answer.", "chatgpt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "video-llm-prediction": "A person enters the screen and then the robot vacuum cleaner starts moving. The person then proceeds to remove the filter of the vacuum cleaner.", "gt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that \"A person enters the screen and then the robot vacuum cleaner starts moving.\" This means that the person enters first and then the vacuum cleaner starts moving.", "chatgpt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "video-llm-prediction": "A person enters the screen and then the robot vacuum cleaner starts moving. The person then proceeds to remove the filter from the vacuum cleaner.", "gt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that \"A person enters the screen and then the robot vacuum cleaner starts moving.\" This indicates that the person's entry precedes the movement of the robot vacuum cleaner.", "chatgpt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "video-llm-prediction": "A person enters the screen and then the robot vacuum cleaner starts moving.", "gt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that \"A person enters the screen, and the robot vacuum cleaner starts moving.\" This indicates that the person enters first and then the robot vacuum cleaner starts moving.", "chatgpt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "video-llm-prediction": "A person enters the screen, and the robot vacuum cleaner starts moving. The person then proceeds to clean the floor.", "gt-answer": "A. A person enters the screen and then the robot vacuum cleaner starts moving", "rating": 1 } ] }, "1108534143": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the puppy is seen walking into a wigwam and then walking out of it. It also mentions that the puppy is staying still in the wigwam.", "chatgpt-answer": "C. walking out of a wigwam", "video-llm-prediction": "A white puppy is seen walking into a wigwam and then walking out of it. The video shows the puppy staying still in the wigwam.", "gt-answer": "C. walking out of a wigwam", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the puppy is seen walking into a wigwam and then walking out of it. Therefore, the correct answer is B. walking into a wigwam. The option A, staying in a wigwam, cannot be supported by the video description as it only mentions the puppy standing still at one point inside the wigwam, but not staying there. Option C, walking out of a wigwam, is partially correct, but it does not cover the full action of the puppy walking into the wigwam first before walking out.", "chatgpt-answer": "B. walking into a wigwam", "video-llm-prediction": "A small white puppy is seen walking into a wigwam and then walking out of it. The puppy is seen standing still in the wigwam at one point.", "gt-answer": "C. walking out of a wigwam", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white puppy is walking into a wigwam and then walking out of it. This indicates that the puppy is not staying in the wigwam but rather going in and coming out.", "chatgpt-answer": "C. walking out of a wigwam", "video-llm-prediction": "A white puppy is seen walking into a wigwam and then walking out of it. The puppy is seen standing still in the wigwam at one point.", "gt-answer": "C. walking out of a wigwam", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the puppy is seen walking into a wigwam and then walking out of it. It also states that the puppy is seen standing still in the wigwam at one point. Based on this information, we can conclude that the puppy is both walking into and walking out of the wigwam.", "chatgpt-answer": "C. walking out of a wigwam", "video-llm-prediction": "A small white puppy is seen walking into a wigwam and then walking out of it. The puppy is seen standing still in the wigwam at one point.", "gt-answer": "C. walking out of a wigwam", "rating": 1 } ] }, "1034049020": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the woman is seen walking down the street while holding a paint roller, and then proceeds to clean a wall while walking. This indicates that she is cleaning a wall while walking.", "chatgpt-answer": "A. cleaning a wall while walking", "video-llm-prediction": "A woman is seen walking down the street while holding a paint roller. She then proceeds to clean a wall while walking.", "gt-answer": "C. painting a wall while walking", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is seen walking down the street while holding a paint roller. It further mentions that she proceeds to clean a wall while walking. Therefore, the woman is cleaning a wall while walking.", "chatgpt-answer": "A. cleaning a wall while walking", "video-llm-prediction": "A woman is seen walking down the street while holding a paint roller. She then proceeds to clean a wall while walking. The video showcases the woman's ability to multitask and complete various tasks while on the move.", "gt-answer": "C. painting a wall while walking", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is seen walking down the street while holding a paint roller. Then, it states that she proceeds to clean a wall while walking. This indicates that the woman is cleaning a wall while walking.", "chatgpt-answer": "A. cleaning a wall while walking", "video-llm-prediction": "A woman is seen walking down the street while holding a paint roller. She then proceeds to clean a wall while walking.", "gt-answer": "C. painting a wall while walking", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is walking down the street while holding a paintbrush. It also mentions that she proceeds to clean a wall while walking and continues to walk and paint the wall as she goes. This indicates that the woman is painting a wall while walking.", "chatgpt-answer": "C. painting a wall while walking", "video-llm-prediction": "A woman is seen walking down the street while holding a paintbrush. She then proceeds to clean a wall while walking. The woman continues to walk and paint the wall as she goes.", "gt-answer": "C. painting a wall while walking", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description states that the woman is seen walking down a street and then turns around to paint a wall. The description further mentions that she continues to walk while painting the wall. Therefore, the correct order of events is that she turns back first, then paints the wall while walking.", "chatgpt-answer": "B. Turning back, then painting a wall while walking", "video-llm-prediction": "A woman is seen walking down a street and then turns around to paint a wall. She continues to walk while painting the wall.", "gt-answer": "C. Painting a wall while walking, then turning back", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is seen walking down the street and then turning back to paint a wall. She continues to walk down the street while painting the wall. This indicates that the order of events is first turning back, then painting a wall while walking.", "chatgpt-answer": "B. Turning back, then painting a wall while walking", "video-llm-prediction": "A woman is seen walking down the street and then turning back to paint a wall. She continues to walk down the street while painting the wall.", "gt-answer": "C. Painting a wall while walking, then turning back", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is first seen walking down the street, then she turns around to paint a wall, and finally continues to walk while painting the wall. This indicates that the order of events is: turning back, then painting a wall while walking.", "chatgpt-answer": "B. Turning back, then painting a wall while walking", "video-llm-prediction": "A woman is seen walking down the street and then turns around to paint a wall. She continues to walk while painting the wall.", "gt-answer": "C. Painting a wall while walking, then turning back", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is seen walking down the street while holding a paintbrush. Then, she turns around and begins painting a wall. Finally, she continues to walk down the street while painting the wall. This indicates that the correct order of events is B. Turning back, then painting a wall while walking.", "chatgpt-answer": "B. Turning back, then painting a wall while walking", "video-llm-prediction": "A woman is seen walking down the street while holding a paintbrush. She turns around and begins painting a wall. She continues to walk down the street while painting the wall.", "gt-answer": "C. Painting a wall while walking, then turning back", "rating": 0 } ] }, "1047368344": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the girl jumps into the water and swims towards the shore.", "chatgpt-answer": "C. swimming in the water", "video-llm-prediction": "A girl wearing a yellow dress is seen walking on a wooden pier. She then jumps into the water and swims towards the shore.", "gt-answer": "A. jumping into water", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the girl jumps into the water and swims towards the shore.", "chatgpt-answer": "C. swimming in the water", "video-llm-prediction": "The video shows a girl wearing a yellow dress who is seen walking on a wooden pier. She then jumps into the water and swims towards the shore. The video captures the beauty of the surrounding nature, with mountains and trees visible in the background. The girl's movements are graceful and fluid, and she seems to be enjoying the water. The video is a perfect representation of the serene and peaceful environment that the girl is in.", "gt-answer": "A. jumping into water", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is seen walking on a dock and then jumping into the water.", "chatgpt-answer": "A. jumping into water", "video-llm-prediction": "A woman in a yellow dress is seen walking on a dock and then jumping into the water.", "gt-answer": "A. jumping into water", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the girl jumps into the water and swims towards the shore.", "chatgpt-answer": "C. swimming in the water", "video-llm-prediction": "A girl wearing a yellow dress is seen walking on a wooden pier. She then jumps into the water and swims towards the shore.", "gt-answer": "A. jumping into water", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description states that the girl first walks on a wooden pier and then proceeds to jump into the water. After that, she takes off her clothes and jumps back into the water. Therefore, the correct order of events for the girl is jumping into water and then taking off clothes.", "chatgpt-answer": "D. jumping into water and then taking off clothes", "video-llm-prediction": "A girl is seen walking on a wooden pier and then proceeds to jump into the water. She then takes off her clothes and jumps back into the water.", "gt-answer": "B. taking off clothes and then jumping into water", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is first seen walking on a dock and then jumping into the water. Afterward, she proceeds to take off her clothes and jumps back into the water. Therefore, the correct order of events for the woman is jumping into the water and then taking off clothes.", "chatgpt-answer": "D. jumping into water and then taking off clothes", "video-llm-prediction": "A woman is seen walking on a dock and then jumping into the water. She then proceeds to take off her clothes and jumps back into the water.", "gt-answer": "B. taking off clothes and then jumping into water", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the girl is walking on a wooden pier, then jumping into the water and swimming towards the shore. After that, she puts on her clothes and jumps into the water again. Hence, the correct order of events for the girl is jumping into water and then putting on clothes.", "chatgpt-answer": "C. jumping into water and then putting on clothes", "video-llm-prediction": "A girl is seen walking on a wooden pier, then she jumps into the water and swims towards the shore. She then puts on her clothes and jumps into the water again.", "gt-answer": "B. taking off clothes and then jumping into water", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the girl is first seen walking on a wooden pier, then she takes off her clothes and jumps into the water. Afterward, she puts on her clothes and jumps into the water again. Therefore, the order of events for the girl is:", "chatgpt-answer": "B. taking off clothes and then jumping into water", "video-llm-prediction": "A girl is seen walking on a wooden pier, then she takes off her clothes and jumps into the water. She then puts on her clothes and jumps into the water again.", "gt-answer": "B. taking off clothes and then jumping into water", "rating": 1 } ] }, "1060403198": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the tree is seen with green leaves and branches, which gradually changes to brown and shedding leaves. This indicates that the tree is changing color and shedding leaves.", "chatgpt-answer": "D. changing color", "video-llm-prediction": "The video showcases a tree with green leaves and branches, which gradually changes to brown and shedding leaves. The tree is seen in various positions, including a close-up shot of its branches and leaves. The video also includes a shot of a tree with no leaves, and a close-up shot of a tree with green leaves. The video emphasizes the tree's growth and changes throughout the seasons.", "gt-answer": "A. increasing height", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the tree is seen changing from green leaves to brown and shedding leaves. This indicates that the tree is changing color and shedding leaves.", "chatgpt-answer": "D. changing color", "video-llm-prediction": "The video showcases a tree with green leaves and branches, which gradually changes to brown and shedding leaves. The tree is seen in different positions, including a close-up shot of the branches and leaves. The video highlights the tree's growth and changes throughout the seasons.", "gt-answer": "A. increasing height", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the tree is shown in different seasons, including winter and fall. It also states that the tree is seen in different positions and ends with a close-up shot of the tree. This indicates that the tree is going through changes. The video shows the tree in different positions and focuses on its leaves and colors, suggesting that the tree is changing color.", "chatgpt-answer": "D. changing color", "video-llm-prediction": "A tree with green leaves is shown in the video. The tree is seen in different positions, including a close-up shot of the leaves and a wider shot of the tree. The video also shows the tree in different seasons, including winter and fall. The tree is shown in a white background, and the video ends with a close-up shot of the tree.", "gt-answer": "A. increasing height", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the leaves of the tree turn yellow and fall off. This indicates that the tree is shedding its leaves.", "chatgpt-answer": "C. shedding leaves", "video-llm-prediction": "A tree with green leaves is shown in the video. The leaves turn yellow and fall off the tree. The tree is also shown with no leaves.", "gt-answer": "A. increasing height", "rating": 0 } ] }, "1100074677": { "order": [ { "chatgpt-reasoning": "The video description states that the person is seen standing the paper note up and then writing something on it. They then proceed to tear the paper note apart and throw it away. This indicates that the correct order of events is first standing the paper note up, then writing something on it, and finally tearing it apart and throwing it away.", "chatgpt-answer": "C. standing the paper note up and then writing something on the paper note", "video-llm-prediction": "A person is seen standing a paper note up and then writing something on it. They then proceed to tear the paper note apart and throw it away.", "gt-answer": "D. writing something on the paper note and then standing the paper note up", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person writes on a piece of paper, tears it apart and throws it away. Then, the person stands the paper note up and writes something on it. This sequence of events indicates that the correct order is: tearing apart the paper note and then throwing it away, followed by standing the paper note up and then writing something on it.", "chatgpt-answer": "B. tearing apart the paper note and then throwing it away", "video-llm-prediction": "A person is seen writing on a piece of paper, followed by tearing it apart and throwing it away. The person then stands the paper note up and writes something on it.", "gt-answer": "D. writing something on the paper note and then standing the paper note up", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person first tears apart the paper note and then throws it away. After that, the same person stands the paper note up and writes something on it.", "chatgpt-answer": "B. tearing apart the paper note and then throwing it away", "video-llm-prediction": "A person is seen tearing apart a paper note and then throwing it away. The same person is then seen standing the paper note up and writing something on it.", "gt-answer": "D. writing something on the paper note and then standing the paper note up", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person is seen writing on a paper note, which is then torn apart and thrown away. Therefore, the correct order of events would be \"writing something on the paper note\" followed by \"tearing apart the paper note\" and then \"throwing it away\".", "chatgpt-answer": "D. writing something on the paper note and then tearing apart the paper note", "video-llm-prediction": "A person is seen writing on a paper note, which is then torn apart and thrown away. The video showcases the process of writing, tearing, and throwing away the paper note.", "gt-answer": "D. writing something on the paper note and then standing the paper note up", "rating": 1 } ] }, "1100350201": { "order": [ { "chatgpt-reasoning": "The video description mentions that the man is seen kneeling down and putting something in the little girl's hand, then he stands up and puts his hand on the little girl's shoulder. This indicates that the man takes action before the girl.", "chatgpt-answer": "C. The little girl is drawn and then the man is drawn", "video-llm-prediction": "The video shows a man and a little girl. The man is seen kneeling down and putting something in the little girl's hand. He then stands up and puts his hand on the little girl's shoulder. The video ends with the man and the little girl standing next to each other.", "gt-answer": "C. The little girl is drawn and then the man is drawn", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is adjusting the girl's hair, then proceeds to brush her hair. The girl sits down, and the man continues to brush her hair. There is no mention or indication of any drawing or erasing happening in the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a little girl standing in front of a mirror. The man is seen adjusting the girl's hair, and then he proceeds to brush her hair. The girl then sits down, and the man continues to brush her hair. The video seems to be a simple yet heartwarming scene of a man taking care of a little girl's hair. The video's simplicity is what makes it so relatable, as it could be any father or guardian taking care of their child's hair. The video's message is clear, and it is to show the love", "gt-answer": "C. The little girl is drawn and then the man is drawn", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen kneeling down and putting something on the little girl's hand. It then mentions that he stands up and walks away. This indicates that the man is drawn first and then the little girl appears in the video.", "chatgpt-answer": "C. The little girl is drawn and then the man is drawn", "video-llm-prediction": "The video shows a man and a little girl. The man is seen kneeling down and putting something on the little girl's hand. He then stands up and walks away.", "gt-answer": "C. The little girl is drawn and then the man is drawn", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man is kneeling down and putting something on the little girl's hand, and then he stands up and walks away. This implies that the man is present in the video before the little girl, and he interacts with her before leaving.", "chatgpt-answer": "C. The little girl is drawn and then the man is drawn", "video-llm-prediction": "The video shows a man and a little girl. The man is seen kneeling down and putting something on the little girl's hand. He then stands up and walks away.", "gt-answer": "C. The little girl is drawn and then the man is drawn", "rating": 1 } ] }, "1099109715": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the variety of fruits and vegetables is being showcased. It also emphasizes the importance of consuming a diverse range of fruits and vegetables. Both of these points indicate that the number of fruits and vegetables is increasing.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, oranges, and carrots. The fruits and vegetables are displayed on a black table, and the video emphasizes the importance of consuming a diverse range of fruits and vegetables for a healthy diet. The video also highlights the benefits of consuming fruits and vegetables, such as improved digestion and overall health.", "gt-answer": "B. increasing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a variety of fruits and vegetables are showcased, including tomatoes, oranges, and broccoli. However, it does not mention any changes happening to the number of fruits and vegetables.", "chatgpt-answer": "D. staying the same", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, oranges, and broccoli. The tomatoes are shown in different positions, including on a table and in a bowl. The oranges are also displayed in various positions, including on a table and in a bowl. The broccoli is shown in a bowl. The video emphasizes the importance of consuming a variety of fruits and vegetables for a healthy diet.", "gt-answer": "B. increasing", "rating": 0 }, { "chatgpt-reasoning": "The video showcases a variety of fruits and vegetables and emphasizes the importance of consuming a healthy diet. However, there is no information provided in the video description about any changes happening to the number of fruits and vegetables.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, apples, and oranges. The fruits and vegetables are displayed on a black background, with some of them being cut up and displayed in bowls. The video emphasizes the importance of consuming a healthy diet, with a focus on fruits and vegetables.", "gt-answer": "B. increasing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the various fruits and vegetables are being showcased, including tomatoes, oranges, and broccoli. It also emphasizes the importance of consuming a variety of fruits and vegetables for a healthy diet. From this information, we can infer that the number of fruits and vegetables is likely increasing or staying the same, as there is no mention of them becoming rotten or decreasing in quantity.", "chatgpt-answer": "D. staying the same", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, oranges, and broccoli. The tomatoes are shown in different positions, including on a table and in a bowl. The oranges are also displayed in various positions, including on a table and in a bowl. The broccoli is shown in a bowl. The video emphasizes the importance of consuming a variety of fruits and vegetables for a healthy diet.", "gt-answer": "B. increasing", "rating": 0 } ] }, "1051211272": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the sandwich is cut in half and the bottom half is eaten. This indicates that the sandwich is gradually being eaten out and disappearing.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "The video shows a close-up of a sandwich with tomatoes and cream cheese on top of a piece of bread. The sandwich is then cut in half and the bottom half is eaten. The video ends with a close-up of the bread.", "gt-answer": "C. gradually being eaten out and disappearing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sandwich is being eaten, with the sound of it being cut and eaten audible. This indicates that the sandwich is gradually being eaten out and disappearing.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "A close-up shot of a sandwich is shown, with a leaf placed on top of it. The sandwich is then cut in half, revealing the creamy filling inside. The sandwich is then eaten, with the leaf still on top. The video showcases the process of making and eating a sandwich with cream cheese. The focus is on the sandwich and its filling, with the leaf serving as a decorative element. The video is shot in a simple and straightforward manner, with no additional elements or props. The sound of the sandwich being cut and eaten is also audible,", "gt-answer": "C. gradually being eaten out and disappearing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the toast with cream cheese is gradually being eaten out and disappearing.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "A piece of toast with cream cheese is shown, and it gradually gets eaten out and disappears.", "gt-answer": "C. gradually being eaten out and disappearing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is making a sandwich by putting cream cheese on bread, adding tomatoes on top, cutting it in half, and eating it. There is no indication that the toast with cream cheese is getting bigger or staying the same size. However, it is mentioned that the sandwich is being eaten out and disappearing gradually.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "A person is seen making a sandwich by putting cream cheese on bread and adding tomatoes on top. The sandwich is then cut in half and eaten.", "gt-answer": "C. gradually being eaten out and disappearing", "rating": 1 } ] }, "1059815936": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the paper is transforming from a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video showcases the transformation of a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball. The process is repeated several times, highlighting the versatility of the paper.", "gt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the paper is going through a process of transformation from a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video showcases the process of transforming a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball. The video starts with a close-up shot of a wrinkled paper ball, which then transitions into a flattened sheet of paper. The flattened sheet of paper is then shown being transformed back into a wrinkled paper ball. The video provides a visual representation of the process of transforming a wrinkled paper ball into a flattened sheet and back into a wrinkled paper ball.", "gt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the paper is being crumpled up and then flattened out multiple times. This indicates a continuous process of changing from a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video shows a piece of paper being crumpled up and then flattened out. The paper is then crumpled up again and flattened out once more.", "gt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the paper is transforming from a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video showcases the process of transforming a wrinkled paper ball into a flattened sheet and then back into a wrinkled paper ball.", "gt-answer": "A. changing from wrinkled paper ball into a flattened sheet", "rating": 1 } ] }, "1086423566": { "order": [ { "chatgpt-reasoning": "The video description mentions that the camera starts with a bowl of rice and beans, pans out to show the entire bowl, zooms in to show the ingredients being added, and then pans out again to show the entire bowl. This indicates that the food is added into the bowl first, and then the bowl is shown rotating.", "chatgpt-answer": "B. Food is added into the bowl and then the bowl rotates", "video-llm-prediction": "The video starts with a bowl of rice and beans, and then the camera pans out to show the entire bowl. The camera then zooms in to show the ingredients being added to the bowl. The ingredients include shrimp, tomatoes, and avocado. The camera then pans out to show the entire bowl again. The video ends with the camera panning out to show the entire bowl.", "gt-answer": "B. Food is added into the bowl and then the bowl rotates", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person starts by adding rice and beans to the bowl, followed by adding a variety of vegetables, seasoning, and onions. There is no mention of the bowl rotating or flipping upside down in the video description.", "chatgpt-answer": "B. Food is added into the bowl and then the bowl rotates", "video-llm-prediction": "The video showcases a person preparing a healthy and delicious meal by adding various ingredients to a bowl. The person starts by adding rice and beans to the bowl, followed by adding a variety of vegetables, including tomatoes, avocado, and shrimp. The person then proceeds to add some seasoning and onions to the mixture, which is then stirred to combine all the ingredients. The final result is a colorful and nutritious meal that is perfect for a healthy lunch or dinner.", "gt-answer": "B. Food is added into the bowl and then the bowl rotates", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the bowl rotates before the food is added, then it rotates again after the ingredients are added, and finally, it flips upside down.", "chatgpt-answer": "A. The bowl rotates and then food is added into the bowl", "video-llm-prediction": "A bowl of food is shown, and then the bowl rotates. Tomatoes, shrimp, and rice are added to the bowl, and the bowl rotates again. Finally, the bowl flips upside down.", "gt-answer": "B. Food is added into the bowl and then the bowl rotates", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the order of events in the video is that food is added into the bowl and then the bowl rotates.", "chatgpt-answer": "A. The bowl rotates and then food is added into the bowl", "video-llm-prediction": "A video showcases the process of making a healthy and delicious meal. The video starts with a bowl of rice and beans, which is then topped with various vegetables, including tomatoes, avocado, and shrimp. The ingredients are mixed together, and the final product is presented in a visually appealing manner. The video emphasizes the importance of incorporating healthy ingredients into one's diet and provides a step-by-step guide to making this meal. Overall, the video is informative and inspiring, encouraging viewers to try", "gt-answer": "B. Food is added into the bowl and then the bowl rotates", "rating": 0 } ] }, "1069611487": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the video starts with a close-up shot of a pizza box, then shows a pizza being cut into slices, followed by the slices being eaten, and finally ends with the pizza box being shown again. Therefore, the correct order of events in the video is that the paper box appears first, then the pizza slices appear.", "chatgpt-answer": "B. Pizza slices appear, then a paper box appears", "video-llm-prediction": "The video starts with a close-up shot of a pizza box, and then we see a pizza being cut into slices. The slices are then shown being eaten, and the video ends with the pizza box being shown again.", "gt-answer": "C. A paper box appears, then pizza slices disappear", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the pizza is being cut into slices and then being eaten. Therefore, the correct order of events in the video should be that the pizza slices appear first, followed by a paper box appearing.", "chatgpt-answer": "B. Pizza slices appear, then a paper box appears", "video-llm-prediction": "The video showcases a pizza being cut into slices and then being eaten. The pizza slices are shown being taken away from the box, and the box is shown being opened. The video provides a visual representation of the pizza being cut and eaten.", "gt-answer": "C. A paper box appears, then pizza slices disappear", "rating": 0 }, { "chatgpt-reasoning": "The video description states that initially, a slice of pizza is missing from the box. Then, several slices go missing. This implies that the pizza slices disappear first and then a paper box is shown.", "chatgpt-answer": "A. Pizza slices disappear, then a paper box appears", "video-llm-prediction": "A pizza box is shown with a slice of pizza missing. The box is then shown with several slices missing.", "gt-answer": "C. A paper box appears, then pizza slices disappear", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the pizza box is shown with a slice of pizza missing first, and then it is shown with all the slices missing. This implies that the pizza slices disappear before the paper box appears.", "chatgpt-answer": "A. Pizza slices disappear, then a paper box appears", "video-llm-prediction": "A pizza box is shown with a slice of pizza missing. The box is then shown with all the slices missing.", "gt-answer": "C. A paper box appears, then pizza slices disappear", "rating": 0 } ] }, "1034419625_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the man is seen moving away from the camera and towards it. Therefore, the correct answer is C. moving away from the camera.", "chatgpt-answer": "C. moving away from the camera", "video-llm-prediction": "The video shows a man playing basketball in a dark room. He is seen dribbling the ball and making a shot into the basket. The man is also seen moving away from the camera and towards it.", "gt-answer": "B. moving from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the direction of the man's movement. It only describes the man dribbling a basketball and making a shot, but there is no indication of his movement towards or away from the camera or from left to right or right to left.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen dribbling a basketball and making a shot. The video showcases the man's basketball skills and his ability to make a shot.", "gt-answer": "B. moving from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the man is moving away from the camera.", "chatgpt-answer": "C. moving away from the camera", "video-llm-prediction": "A man is seen moving away from the camera while holding a basketball.", "gt-answer": "B. moving from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is playing basketball, but it does not provide any information about his direction of movement. Therefore, we cannot determine the direction based on the given description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen playing basketball in a dark room. He is seen dribbling the ball and then throwing it into the basket.", "gt-answer": "B. moving from right to left", "rating": 0 } ] }, "1094590221_reverse": { "direction": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that the man is seen dribbling the ball and throwing it into the basket. This implies that the basketball is moving towards the basket, which means it is moving in a straight ahead direction.", "chatgpt-answer": "A. straight ahead", "video-llm-prediction": "A man is seen playing basketball in a court. He is seen dribbling the ball and then throwing it into the basket. The video shows the man playing basketball in different positions and angles.", "gt-answer": "B. left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is playing basketball and dribbling the ball. When a player dribbles the ball, it typically moves in the direction they are moving. Therefore, based on the information provided, we can infer that the basketball is moving in the same direction as the man's movements.", "chatgpt-answer": "A. straight ahead", "video-llm-prediction": "A man is seen playing basketball in a court. He is seen dribbling the ball and then throwing it into the basket. The video captures the man's movements as he plays basketball.", "gt-answer": "B. left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a basketball player shoots a basket. Based on the traditional movement of shooting a basketball, the player would typically shoot straight ahead towards the basket.", "chatgpt-answer": "A. straight ahead", "video-llm-prediction": "A basketball player shoots a basket while the sun sets in the background.", "gt-answer": "B. left to right", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the man throws the ball up in the air and makes a basket. This indicates that the basketball is moving vertically, from bottom to top.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen playing basketball in a court. He throws the ball up in the air and makes a basket.", "gt-answer": "B. left to right", "rating": 0 } ] }, "1111657885_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that some people are skating towards the camera and others are skating parallel to the screen.", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "A group of people are skating on an ice rink, with some skating towards the camera and others skating parallel to the screen.", "gt-answer": "C. away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that \"Some of them are skating towards the camera while others are skating parallel to the screen.\"", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "The video shows a group of people skating on an ice rink. Some of them are skating towards the camera while others are skating parallel to the screen. The skaters are wearing different colored outfits, and the ice rink is surrounded by a blue wall. The video captures the skaters' movements as they glide across the ice, with some of them performing tricks and jumps. The sound of the skates scraping against the ice and the cheers of the spectators can be heard in the background. Overall, the video showcases the beauty and excitement of ice skating", "gt-answer": "C. away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that some people are skating towards the camera while others are skating parallel to the screen.", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "People are skating on an ice rink, some are skating towards the camera while others are skating parallel to the screen.", "gt-answer": "C. away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that some people are skating towards the camera and others are skating parallel to the screen. Therefore, the correct answer is A. towards the camera.", "chatgpt-answer": "A. towards the camera", "video-llm-prediction": "People are skating on an ice rink, with some skating towards the camera and others skating parallel to the screen.", "gt-answer": "C. away from the camera", "rating": 0 } ] }, "1089810425_reverse": { "direction": [ { "chatgpt-reasoning": "The video description does not mention any specific panning direction. However, it states that the video starts with a man and a woman standing in the pool, then shows a group of people in the pool, and ends with the group still in the pool. Since there is no mention of any movement or change in position, it can be inferred that there is no panning in the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of people having fun in a pool. They are throwing water at each other and laughing. The video starts with a man and a woman standing in the pool, and then it shows a group of people in the pool. The people in the pool are throwing water at each other and having a great time. The video ends with the group of people still in the pool, still throwing water at each other.", "gt-answer": "A. left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans from left to right, showing the entire group.", "chatgpt-answer": "A. left to right", "video-llm-prediction": "The video captures a group of people having fun in a pool. They are seen splashing water and dancing around. The camera pans from left to right, showing the entire group. The video is a perfect representation of a fun day spent with friends in the pool.", "gt-answer": "A. left to right", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention anything about the panning direction. It only describes the activities of people in a pool. Therefore, there is not enough information to determine the correct answer.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of people are seen playing in a pool and throwing water at each other.", "gt-answer": "A. left to right", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a group of people is having fun in a pool by throwing water at each other while dancing. None of the options mention anything related to the movement of the camera. Therefore, it is not possible to determine the direction of the panning based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a group of people having fun in a pool by throwing water at each other while dancing.", "gt-answer": "A. left to right", "rating": 0 } ] }, "1059718130_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the sun is setting in the sky. It also states that the sun appears to rise and set in the same location. This indicates that the sun is moving downward, or setting.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The video showcases the sun setting in the sky, with the sun appearing to rise and set in the same location. The sun is seen in the sky, with clouds moving around it. The video captures the beauty of the sunset and the changing colors of the sky.", "gt-answer": "A. falling", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that \"The sun sets in the sky,\" indicating that the sun is moving downwards in the sky.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The sun sets in the sky, casting a warm glow on the clouds. The sun's rays reflect off the clouds, creating a beautiful display of colors. The sun sets in the sky, casting a warm glow on the clouds. The sun's rays reflect off the clouds, creating a beautiful display of colors.", "gt-answer": "A. falling", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the sun is setting in the sky, indicating that it is moving downwards.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The sun sets in the sky, and the clouds move around it.", "gt-answer": "A. falling", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the sun sets in the sky, which means it is moving in a downward direction.", "chatgpt-answer": "A. setting", "video-llm-prediction": "The sun sets in the sky, and the clouds move in the same direction as the sun.", "gt-answer": "A. falling", "rating": 1 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly mentions that the sky is getting darker, indicating a decrease in brightness.", "chatgpt-answer": "A. getting darker", "video-llm-prediction": "The video shows a beautiful sunset with the sun setting in the sky. The sun is seen setting in the sky, and the sky is getting darker. The video captures the beauty of the sunset and the changing colors of the sky.", "gt-answer": "A. getting darker", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sky gradually gets darker as the sun sets behind the clouds. This implies that the brightness of the video is getting darker.", "chatgpt-answer": "A. getting darker", "video-llm-prediction": "The video showcases a beautiful sunset with the sun setting behind a cloudy sky. The sun is seen setting behind the clouds, and the sky gradually gets darker. The video captures the serene beauty of the sunset, with the sun setting behind the clouds, and the sky gradually getting darker. The video is a perfect representation of the beauty of nature and the tranquility of the sunset.", "gt-answer": "A. getting darker", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the sun is seen getting darker as the video progresses. This indicates a decrease in brightness.", "chatgpt-answer": "A. getting darker", "video-llm-prediction": "The video shows a large sun setting behind a cloudy sky. The sun is seen getting darker as the video progresses.", "gt-answer": "A. getting darker", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically mentions that the sun in the video is getting darker and brighter. This implies that the overall brightness of the video is changing.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video captures the sunset, with the sun getting darker and brighter, while the sky remains the same.", "gt-answer": "A. getting darker", "rating": 0 } ] }, "1083845854_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the clock hands are moving in a counterclockwise direction.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video shows a clock with a red second hand and a black minute hand. The clock is positioned in the middle of the frame, and the hands move in a counterclockwise direction. The video also includes a close-up shot of the clock's face, which is positioned in the middle of the frame. The video ends with a shot of the clock's face, which is positioned in the middle of the frame.", "gt-answer": "A. counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the clock's hands are moving in a counterclockwise direction.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video showcases a close-up of a clock with its hands moving in a counterclockwise direction. The clock's hands move in a stationary position, and the video provides a detailed view of the clock's hands. The video's focus is on the clock's hands, and the information provided is not relevant to the video content.", "gt-answer": "A. counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the second hand of the clock is moving in a counterclockwise direction. This means that the direction in which the clock hands are moving is counterclockwise.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video shows a clock with a red second hand moving from 12 to 6. The video also includes a piece of information that the second hand moves in a counterclockwise direction.", "gt-answer": "A. counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the first hand is moving counterclockwise while the second hand is moving clockwise.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video showcases a clock with its hands moving in different directions. The first hand moves counterclockwise, while the second hand moves clockwise. The video also features a close-up shot of the clock's face, highlighting the intricate details of the clock's design. The video provides a detailed view of the clock's mechanics and the precision of its movements.", "gt-answer": "A. counterclockwise", "rating": 1 } ] }, "1100329207_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans around the field, showing the sheep in different positions. Panning refers to moving the camera horizontally while keeping the vertical axis fixed. If the camera is panning and showing the sheep in different positions, it means the camera view is moving horizontally.", "chatgpt-answer": "A. moving right", "video-llm-prediction": "The video shows a large herd of sheep grazing in a field. The camera pans around the field, showing the sheep in different positions. The sheep are seen grazing on the grass and walking around the field. The video captures the peaceful and serene atmosphere of the countryside.", "gt-answer": "B. moving backward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the sheep as they move around the field, with some walking towards the camera and others walking away. This implies that the camera is in a stationary position and not moving in any particular direction.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a large herd of sheep grazing in a vast, open field. The camera captures the sheep as they move around the field, with some walking towards the camera and others walking away. The sky is blue and clear, and the landscape is vast and open, with no visible boundaries. The sheep are seen grazing on the grass, and the camera captures their movements as they move around the field. The video provides a peaceful and serene view of the countryside, with the sound of the wind and the occasional bleating of the sheep. Overall, the video is a beautiful", "gt-answer": "B. moving backward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the field, which indicates that the camera view is moving.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a large herd of sheep grazing in a field. The camera pans around the field, showing the sheep in different positions. The sheep are seen grazing on the grass and walking around the field. The video captures the peaceful and serene environment of the field, with the sound of the wind and the occasional bleat of the sheep. Overall, the video provides a calming and relaxing experience for the viewer.", "gt-answer": "B. moving backward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera is capturing the movements of the sheep from various angles. It does not specify the exact direction of the camera movement, but it implies that the camera is moving around the sheep to capture their movements and grazing from different perspectives.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A herd of sheep is seen grazing in a field, with the camera capturing their movements from various angles. The sheep are seen walking around and grazing on the grass, with some of them looking towards the camera. The video showcases the peaceful and serene environment of the field, with the sheep appearing content and relaxed. The camera captures the natural beauty of the field, with the sheep and the grass providing a sense of tranquility. Overall, the video provides a calming and soothing experience for the viewer.", "gt-answer": "B. moving backward", "rating": 0 } ] }, "1089201973_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the ball is kicked from the left side of the field towards the right side. This indicates that the football is moving from left to right.", "chatgpt-answer": "A. moving from left to right", "video-llm-prediction": "A person is seen kicking a soccer ball on a field. The ball is kicked from the left side of the field towards the right side. The person kicks the ball with their feet and the ball flies through the air. The person continues to kick the ball towards the right side of the field.", "gt-answer": "B. moving from right to left", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the person is seen kicking the ball towards the right side of the field multiple times. Each time they kick with their right foot, the ball flies towards the right side, and when they kick with their left foot, the ball flies towards the left side. Therefore, the direction of the football in the video is moving from left to right.", "chatgpt-answer": "A. moving from left to right", "video-llm-prediction": "A person is seen kicking a soccer ball on a field. The ball is kicked from the left side of the field towards the right side. The person kicks the ball with their right foot, and the ball flies towards the right side of the field. The person continues to kick the ball, and the ball is kicked towards the right side of the field. The person kicks the ball with their left foot, and the ball flies towards the left side of the field. The person kicks the ball with their right foot, and the ball flies towards the right side of the field. The person k", "gt-answer": "B. moving from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the ball is kicked from the left side of the field towards the right side. Therefore, the direction of the football in the video is moving from left to right.", "chatgpt-answer": "A. moving from left to right", "video-llm-prediction": "A person is seen kicking a soccer ball on a field. The ball is kicked from the left side of the field towards the right side. The person kicks the ball with their feet and the ball flies through the air.", "gt-answer": "B. moving from right to left", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the person kicks the ball towards the right side of the field twice and towards the left side of the field twice. This indicates that the ball is changing its direction alternately between left and right.", "chatgpt-answer": "C. stationary", "video-llm-prediction": "A person is seen kicking a soccer ball on a field. The ball is kicked from the left side of the field towards the right side. The person kicks the ball with their right foot and the ball flies towards the right side of the field. The person then kicks the ball again, and this time the ball flies towards the left side of the field. The person kicks the ball again, and this time the ball flies towards the right side of the field. The person kicks the ball again, and this time the ball flies towards the left side of the field. The person kicks", "gt-answer": "B. moving from right to left", "rating": 0 } ] }, "1034736653_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that there is one woman running in circles while the others run from left to right. Therefore, the woman athletes are running from left to right.", "chatgpt-answer": "C. from left to right", "video-llm-prediction": "The video shows a group of women running on a track. One woman is seen running in circles while the others run from left to right. The video captures the athleticism and endurance of the women as they compete in a race. The consistent information is that the video shows a group of women running on a track.", "gt-answer": "A. from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention the specific direction in which the women athletes are running. It only describes their athleticism, teamwork, and the energy of the race. Therefore, we cannot determine the direction based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a group of women running on a track, with one woman leading the pack. As they run, they pass the baton to each other, showcasing their athleticism and teamwork. The video captures the energy and excitement of the race, with the women pushing themselves to their limits. The sound of their footsteps and the cheers of the crowd add to the atmosphere of the event. Overall, the video is a testament to the power of teamwork and the human spirit of competition.", "gt-answer": "A. from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the women are running in a circle on a track, with one woman leading the pack. This indicates that the women athletes are running in circles.", "chatgpt-answer": "B. in circles", "video-llm-prediction": "A group of women are seen running on a track, with one woman leading the pack. They are all wearing athletic gear and are running in a circle. The video captures the athletes' movements as they run around the track, with the woman in the lead running with determination. The other women are running behind her, with some of them running in circles. The video showcases the athletes' skills and their passion for running.", "gt-answer": "A. from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the women athletes are running on a track, indicating a linear path. It also states that one of them jumps into a pile of sand, suggesting a specific end point for their running. Therefore, we can infer their running direction based on the given information.", "chatgpt-answer": "C. from left to right", "video-llm-prediction": "A group of women are seen running on a track, with one of them jumping into a pile of sand. The video showcases the athleticism and strength of these women as they compete in a track and field event.", "gt-answer": "A. from right to left", "rating": 0 } ] }, "1084153195_reverse": { "direction": [ { "chatgpt-reasoning": "The video description states that the dolphins are swimming towards the shore, but it mentions that the information provided is not consistent with the video. This means that we cannot rely on the video description to determine the actual movement of the dolphins.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows two dolphins swimming towards the shore, but the information provided is not consistent with the video.", "gt-answer": "C. swimming away from the shore", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that one dolphin is swimming towards the shore while the other dolphin is hovering in one place. It also mentions that the dolphins are seen swimming away from the shore.", "chatgpt-answer": "C. swimming away from the shore", "video-llm-prediction": "The video shows two dolphins swimming in the ocean, with one dolphin swimming towards the shore while the other dolphin is hovering in one place. The dolphins are seen swimming away from the shore, and the video captures the beauty of the ocean and the graceful movement of the dolphins.", "gt-answer": "C. swimming away from the shore", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that one of the dolphins is swimming towards the shore while the other is hovering in one place.", "chatgpt-answer": "A. swimming towards the shore", "video-llm-prediction": "Two dolphins are seen swimming in the ocean, one of them is swimming towards the shore while the other is hovering in one place.", "gt-answer": "C. swimming away from the shore", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that two dolphins are swimming towards the shore and another pair is hovering in one place. It also mentions that the dolphins are seen swimming away from the shore as well.", "chatgpt-answer": "A. swimming towards the shore, C. swimming away from the shore", "video-llm-prediction": "Two dolphins are seen swimming towards the shore, while another pair is hovering in one place. The dolphins are seen swimming away from the shore as well.", "gt-answer": "C. swimming away from the shore", "rating": 0 } ] }, "1081092839_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the sun is setting in the background, indicating that it is descending.", "chatgpt-answer": "A. descending", "video-llm-prediction": "The video captures the serene beauty of a snowy field during sunset. The sun is seen setting in the background, casting a warm glow on the snow-covered landscape. The camera pans around the field, showcasing the snow-covered trees and the vast expanse of snow. The video ends with the sun setting in the background, creating a peaceful and calming atmosphere.", "gt-answer": "B. ascending", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sun is seen moving sideways.", "chatgpt-answer": "C. moving sideways", "video-llm-prediction": "The video showcases a serene sunset in a snowy field with a single tree standing tall. The sun is seen moving sideways, and the sky is filled with beautiful colors. The video captures the beauty of nature and the tranquility of the moment.", "gt-answer": "B. ascending", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sun is seen moving sideways.", "chatgpt-answer": "C. moving sideways", "video-llm-prediction": "The video captures the serene beauty of a snowy landscape during sunset. The sun is seen moving sideways, casting a warm glow on the snow-covered trees and hills. The video also features a tree with no leaves, which stands out against the snowy backdrop. The video is a perfect representation of the peacefulness of nature during the winter season.", "gt-answer": "B. ascending", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun is seen moving sideways.", "chatgpt-answer": "C. moving sideways", "video-llm-prediction": "The video showcases a serene sunset in a snowy field with a tree in the foreground. The sun is seen moving sideways, and the sky is painted with warm hues of orange and pink. The snow-covered landscape is illuminated by the setting sun, creating a picturesque scene.", "gt-answer": "B. ascending", "rating": 0 } ] }, "1059462749_reverse": { "direction": [ { "chatgpt-reasoning": "The video description specifically mentions that the person climbing up is seen climbing up the ladder, while the person climbing down is seen climbing down the ladder. This indicates that the person moving is going upwards.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing a ladder in the opposite direction. The man climbing up is wearing a blue shirt and jeans. The man climbing down is wearing a blue shirt and jeans as well. The man climbing up is seen climbing up the ladder while the man climbing down is seen climbing down the ladder.", "gt-answer": "C. upwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is seen climbing up and down the ladder, which indicates that he is moving vertically. Since the video ends with the man climbing the ladder, it can be concluded that he is moving upwards.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man is seen climbing a metal ladder while another man is climbing a metal staircase. The man climbing the ladder is wearing a blue shirt and jeans, while the other man is wearing a blue shirt and blue jeans. The man climbing the ladder is seen climbing up and down the ladder while the other man is climbing up the staircase. The video shows the man climbing the ladder from different angles, and the man climbing the staircase is seen from a distance. The video ends with the man climbing the ladder.", "gt-answer": "C. upwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is climbing a ladder, and it also specifies that there is another man climbing a ladder in the opposite direction. Since the opposite direction would be going against the first man's movement, we can infer that the person is moving upwards.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing a ladder in the opposite direction.", "gt-answer": "C. upwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that both the man climbing the ladder and the man climbing the staircase are seen climbing up and down. Since there is no mention of them moving in any other direction, we can conclude that they are moving upwards.", "chatgpt-answer": "C. upwards", "video-llm-prediction": "A man is seen climbing a metal ladder while another man is climbing a metal staircase. The man climbing the ladder is wearing blue jeans and a blue shirt. The man climbing the staircase is wearing blue jeans and a blue shirt. The man climbing the ladder is seen climbing up and down the ladder. The man climbing the staircase is seen climbing up and down the staircase.", "gt-answer": "C. upwards", "rating": 1 } ] }, "1088279109_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the elevator is seen moving up and down in the video.", "chatgpt-answer": "A. rising", "video-llm-prediction": "The video shows an elevator going up and down in a building. The elevator is seen moving up and down in the video.", "gt-answer": "B. going down", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the elevator starts moving upwards and then stops at a certain point. This indicates that the elevator is rising.", "chatgpt-answer": "A. rising", "video-llm-prediction": "The video showcases an elevator in a building, where it starts moving upwards and then stops at a certain point. The camera then pans around the elevator, providing a clear view of the inside and outside of the building. The video captures the elevator's movement and the surrounding environment, making it an interesting and informative piece for anyone interested in architecture or urban design.", "gt-answer": "B. going down", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the elevator is going up and down in a building. This indicates that the elevator is in motion and moving vertically. The correct answer would be \"rising\" as it accurately describes the upward movement of the elevator.", "chatgpt-answer": "A. rising", "video-llm-prediction": "The video shows an elevator going up and down in a building. The information that is consistent with the video is that the elevator is going up.", "gt-answer": "B. going down", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the elevator is seen going up and down, indicating that it is in motion.", "chatgpt-answer": "A. rising", "video-llm-prediction": "The video showcases an elevator in a building, where it is seen going up and down. The video captures the elevator's movement from different angles, providing a comprehensive view of its operation. The video also highlights the building's architecture and design, with a focus on the elevator's position within the structure. The video's purpose is to provide a visual representation of the elevator's function and its integration into the building's overall design.", "gt-answer": "B. going down", "rating": 0 } ] }, "1096612823_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera starts with a wide shot of the road, then zooms in, pans to the left, zooms out, and finally rotates to provide a 360-degree view. This indicates that the camera is performing multiple movements throughout the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a winding road surrounded by trees and mountains. The camera captures the road from different angles, including a bird's eye view. The video starts with a wide shot of the road, and then zooms in to show the details of the road. The camera then pans to the left, providing a broader view of the surrounding landscape. The video then zooms out, providing a panoramic view of the entire road. Finally, the camera rotates, providing a 360-degree view of the road.", "gt-answer": "A. zooming out", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera starts with a wide shot of the road and captures the changing scenery as the car moves forward. Then, it mentions that the camera zooms out to provide a broader perspective of the road and its surroundings. Based on this information, we can conclude that the camera is zooming out in the video.", "chatgpt-answer": "A. zooming out", "video-llm-prediction": "The video showcases a scenic drive through a winding road surrounded by lush greenery. The camera captures the beauty of the landscape as the car makes its way through the winding road. The video starts with a wide shot of the road, and as the car moves forward, the camera follows its movement, capturing the changing scenery. The camera then zooms out, providing a broader perspective of the road and its surroundings. The video ends with a shot of the car driving away, leaving the viewer with a sense of awe and appreciation for the beauty of nature.", "gt-answer": "A. zooming out", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the road from different angles, including a bird's eye view. This implies that the camera is moving or changing perspective, rather than zooming, rotating, or panning in a specific direction.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a winding road surrounded by trees and mountains. The camera captures the road from different angles, including a bird's eye view. The video also includes a shot of a car driving down the road.", "gt-answer": "A. zooming out", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the beauty of the forest and ends with a panoramic view. This suggests a zooming out effect, where the camera slowly moves away from the subject to reveal a wider view.", "chatgpt-answer": "A. zooming out", "video-llm-prediction": "The video showcases a scenic drive through a forest with winding roads and trees on both sides. The camera captures the beauty of the forest and the drive, with the sound of the engine and the rustling of leaves in the background. The video ends with a panoramic view of the forest.", "gt-answer": "A. zooming out", "rating": 1 } ] }, "1075484900_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the baby is passed from one woman to another, implying a circular motion. Since the video ends with the baby being passed back to the first woman, it can be inferred that the baby is facing forward in relation to the man throughout the video.", "chatgpt-answer": "A. Forward", "video-llm-prediction": "The video shows a woman holding a baby while smiling and talking to the camera. The baby is then passed to another woman who also smiles and talks to the camera. The baby is then passed to a third woman who also smiles and talks to the camera. The video ends with the baby being passed back to the first woman.", "gt-answer": "B. Turning towards the man", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the baby is being passed from the woman to the man, implying that they are facing each other. Therefore, the child is facing forward in relation to the man.", "chatgpt-answer": "A. Forward", "video-llm-prediction": "The video shows a woman holding a baby while a man stands behind them. The woman then kisses the baby and holds him in front of her. The baby is then passed to the man, who holds him in front of the woman. The video captures the joy and love shared between the woman, the baby, and the man.", "gt-answer": "B. Turning towards the man", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the baby is passed around to the woman and another woman who both smile and talk to the camera before being passed to the man who also smiles and talks to the camera. Since all the individuals in the video are smiling and talking towards the camera, it can be inferred that the child is also facing towards the camera, which means the child is facing forward in relation to the man.", "chatgpt-answer": "A. Forward", "video-llm-prediction": "The video shows a woman holding a baby while smiling and talking to the camera. The baby is then passed around to the woman and another woman, who both smile and talk to the camera. The baby is then passed around to a man, who also smiles and talks to the camera.", "gt-answer": "B. Turning towards the man", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman turns the baby towards the camera and the baby looks at the camera, and then turns the baby away from the camera and the baby looks away. This indicates that the baby is facing towards the camera when turned towards it and facing away from it when turned away.", "chatgpt-answer": "C. Turning away from the man", "video-llm-prediction": "A woman is holding a baby in her arms and smiling at the camera. The baby is also smiling and looking at the camera. The woman then turns the baby towards the camera and the baby looks at the camera. The woman then turns the baby away from the camera and the baby looks away.", "gt-answer": "B. Turning towards the man", "rating": 0 } ] }, "1090578917_reverse": { "direction": [ { "chatgpt-reasoning": "The video description does not mention anything about the direction in which the man is leaping. Therefore, we cannot determine the answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man in an orange shirt is seen kicking a soccer ball towards a goal. He is wearing black shorts and is seen running towards the goal. The ball is seen flying towards the goal, and the man is seen running towards the goal. The man is seen kicking the ball towards the goal, and the ball is seen flying towards the goal. The man is seen running towards the goal, and the ball is seen flying towards the goal. The man is seen running towards the goal, and the ball is seen flying towards the goal. The man is seen running towards the goal, and the ball is seen flying", "gt-answer": "A. to his left", "rating": 0 }, { "chatgpt-reasoning": "The video describes that the man in the orange shirt celebrates his goal by jumping up and down. However, the specific direction in which he is leaping is not mentioned in the description.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A man in an orange shirt is seen lying on the ground while another man in a black shirt is standing in front of him. The man in the orange shirt then gets up and kicks the ball towards the goal. The goalkeeper tries to block the ball, but the man in the orange shirt scores a goal. The man in the orange shirt then celebrates his goal by jumping up and down. The video captures the excitement and thrill of a soccer game, with the man in the orange shirt being the star of the show.", "gt-answer": "A. to his left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is running towards the goal post, falls down, and then gets up and kicks the ball towards the goal post. Based on this information, we can deduce that the man is leaping forward towards the goal post.", "chatgpt-answer": "C. forward", "video-llm-prediction": "A man in an orange shirt is seen running towards the goal post and then falls down. He then gets up and kicks the ball towards the goal post.", "gt-answer": "A. to his left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is running towards the goal and then falling down, before getting up and running back to the goal. Based on this information, we can infer that the man is leaping forward towards the goal.", "chatgpt-answer": "C. forward", "video-llm-prediction": "A man in an orange shirt is seen running towards the goal and then falling down. He then gets up and runs back to the goal.", "gt-answer": "A. to his left", "rating": 0 } ] }, "1075338140_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the ball is rolling from left to right and then rolling from right to left on the same surface.", "chatgpt-answer": "D. rolling from right to left", "video-llm-prediction": "The video shows a ball rolling from left to right on a pink surface. The ball is then shown rolling from right to left on the same surface. The video also shows the ball spinning in place on the same surface.", "gt-answer": "D. rolling from right to left", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the ball is rolling from left to right and then rolls back to the left. This indicates that the ball is moving in both directions, from left to right and from right to left.", "chatgpt-answer": "A. forward and backward", "video-llm-prediction": "A ball is seen rolling from left to right on a pink surface. The ball then rolls back to the left and continues to roll from left to right. The video showcases the ball's movement in different directions.", "gt-answer": "D. rolling from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the ball is rolling from left to right, then rolls back from right to left, and finally continues to roll from left to right.", "chatgpt-answer": "C. rolling from left to right", "video-llm-prediction": "A silver ball is seen rolling from left to right on a pink surface. The ball then rolls back from right to left and continues to roll from left to right.", "gt-answer": "D. rolling from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the ball is rolling from left to right and then back from right to left.", "chatgpt-answer": "D. rolling from right to left", "video-llm-prediction": "A silver ball is seen rolling from left to right on a pink surface. The ball then rolls back from right to left.", "gt-answer": "D. rolling from right to left", "rating": 1 } ] }, "1067268403_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the wind turbines are initially stationary and then it transitions to show the wind turbines rotating in different directions. This indicates that the wind turbines are in fact moving and rotating.", "chatgpt-answer": "C. Rotating counterclockwise", "video-llm-prediction": "The video showcases a serene view of wind turbines situated in the ocean. The camera pans around the area, capturing the beauty of the landscape. The wind turbines are stationary, and the camera captures their position in the ocean. The video then transitions to show the wind turbines rotating in different directions, highlighting their movement in the ocean. The camera captures the wind turbines from different angles, providing a comprehensive view of the area. The video ends with a panoramic view of the wind turbines, showcasing their beauty and the vastness", "gt-answer": "C. Rotating counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the viewer can see the blades spinning in the wind. Since the blades are spinning, it implies that the wind turbines are rotating.", "chatgpt-answer": "C. Rotating counterclockwise", "video-llm-prediction": "The video showcases a serene view of wind turbines situated in the ocean. The camera captures the turbines from a distance, and the sound of the waves crashing against the shore can be heard in the background. The camera then zooms in on the turbines, and the viewer can see the blades spinning in the wind. The camera then pans out to show the entire field of turbines, and the viewer can appreciate the vastness of the ocean and the beauty of the turbines. The video is a perfect representation of the power of nature and the ingenuity", "gt-answer": "C. Rotating counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the wind turbines are initially stationary and then later on, they start rotating in different directions, some clockwise and others counterclockwise.", "chatgpt-answer": "C. Rotating counterclockwise", "video-llm-prediction": "The video showcases a large body of water with numerous wind turbines situated in the middle of it. The turbines are stationary, and the water is calm. The sun is setting in the background, casting a warm glow on the scene. The video then transitions to show the wind turbines rotating in different directions, with some rotating clockwise and others counterclockwise. The video captures the beauty of the water and the wind turbines, creating a serene and peaceful atmosphere.", "gt-answer": "C. Rotating counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the wind turbines are stationary.", "chatgpt-answer": "A. Stationary", "video-llm-prediction": "The video showcases a serene view of wind turbines situated near a body of water. The turbines are stationary, and the water is calm. The sun is setting, casting a warm glow on the scene. The camera captures the beauty of the landscape, with the wind turbines standing tall against the backdrop of the water. The video highlights the peacefulness of the location, with the sound of the water and the gentle hum of the turbines providing a calming atmosphere.", "gt-answer": "C. Rotating counterclockwise", "rating": 0 } ] }, "1096007487_reverse": { "direction": [ { "chatgpt-reasoning": "The video description does not provide any information about the movement of the 3D cloud. Therefore, we cannot determine its direction based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a circle with a pink background and a white circle in the middle. The circle is surrounded by a pink and blue cloud. The video also shows a pink and blue cloud with a white circle in the middle.", "gt-answer": "D. rightward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the 3D cloud moves upward, then downward, and finally to the left and right.", "chatgpt-answer": "D. rightward", "video-llm-prediction": "The video showcases a 3D cloud that moves upward, then downward, and finally to the left and right. The cloud is a mesmerizing sight, and the video captures its movement in great detail.", "gt-answer": "D. rightward", "rating": 1 }, { "chatgpt-reasoning": "The video description does not provide any information about the movement of the 3D cloud. Therefore, it is not possible to determine the direction in which the 3D cloud is moving based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of a circle with a pink outline and a blue light in the middle, and a pink light in the center of the circle. The circle is surrounded by a pink light, and there is a pink light in the middle of the circle.", "gt-answer": "D. rightward", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the 3D cloud moves upward, then downward, and finally to the left and right. Thus, the correct answer is D. rightward.", "chatgpt-answer": "D. rightward", "video-llm-prediction": "The video showcases a 3D cloud that moves upward, then downward, and finally to the left and right. The cloud is the main subject of the video, and its movement is the main direction.", "gt-answer": "D. rightward", "rating": 1 } ] }, "1095939659_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the light source starts off by moving in a clockwise direction, then changes direction and starts moving in a counterclockwise direction, and finally changes direction again and starts moving in an upwards direction. It does not mention anything about the light growing or shrinking.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a light source that moves in a circular motion, with the light source appearing to be a neon light. The light source starts off by moving in a clockwise direction, and then it changes direction and starts moving in a counterclockwise direction. The light source then changes direction again and starts moving in an upwards direction. The video captures the light source's movement in a circular motion, with the light source appearing to be a neon light. The video is a visual representation of the light source's movement in a circular motion, with the light source appearing to be a neon light.", "gt-answer": "C. Counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the light moves in a circular motion starting from the center and moving towards the edges of the screen. This indicates that the light is growing outward in a radial direction.", "chatgpt-answer": "D. Upwards", "video-llm-prediction": "The video features a light that moves in a circular motion, starting from the center and moving towards the edges of the screen. The light appears to be a neon-colored glowing light that creates a mesmerizing effect. The light moves in a circular motion, creating a visually appealing effect. The video seems to be showcasing the light's movement and the different directions it can move in. The light's movement is smooth and fluid, creating a sense of motion and energy. Overall, the video is a visually stunning display of light and movement that is sure to captivate view", "gt-answer": "C. Counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the light is shown in a circular motion, moving downwards, and then moving in both clockwise and counterclockwise directions. However, there is no mention or indication of the light growing or changing in size.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A light is shown in a circular motion, moving downwards, then moving in a clockwise direction, and finally moving in a counterclockwise direction.", "gt-answer": "C. Counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the light source is moving in a circular motion and in a downwards direction. It does not provide any information about the light growing or changing size. Therefore, we cannot determine the direction in which the light is growing based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A light source is shown in the video, and it is moving in a circular motion. The light source is moving in a downwards direction, as indicated by Information A.", "gt-answer": "C. Counterclockwise", "rating": 0 } ] }, "1098785169_reverse": { "direction": [ { "chatgpt-reasoning": "The video description does not mention anything about the direction of the galaxy's spin. Therefore, we cannot determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a beautiful view of a galaxy, with the camera panning around to show the different parts of the galaxy. The camera then zooms in on a specific area of the galaxy, providing a closer look at the stars and other celestial objects. The video ends with the camera panning out to show the entire galaxy once again.", "gt-answer": "A. counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the direction of the galaxy's spin.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a galaxy with a bright center, surrounded by a dark background. The camera pans around the galaxy, providing a comprehensive view of its structure. The video highlights the beauty and complexity of the galaxy, with its swirling patterns and intricate details. The camera captures the galaxy from various angles, providing a dynamic and immersive experience for the viewer. The video ends with a final shot of the galaxy, leaving the viewer with a sense of wonder and awe.", "gt-answer": "A. counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "Since the video describes that the camera is panning around the galaxy, we can assume that the camera is in a fixed position and the galaxy is rotating. The description does not provide information about the direction of rotation, so it is impossible to determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a galaxy with a blue light in the middle, surrounded by a black background. The camera pans around the galaxy, showing its different parts. The video ends with a close-up of the galaxy.", "gt-answer": "A. counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the direction of the galaxy's spin.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a galaxy with a bright blue light in the middle, surrounded by a dark background. The camera pans around the galaxy, revealing its intricate details. The video ends with a shot of the galaxy from a distance.", "gt-answer": "A. counterclockwise", "rating": 0 } ] }, "1099984801_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the clouds are moving away from the camera, creating a sense of movement and dynamism.", "chatgpt-answer": "A. moving away from the camera", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with clouds moving away from the camera. The clouds are seen moving away from the camera, creating a mesmerizing view of the mountain range. The video captures the beauty of nature and the serenity of the mountain range. The clouds moving away from the camera create a sense of movement and dynamism, while the snowy mountain range provides a sense of tranquility and peacefulness. The video is a perfect representation of the beauty of nature and the awe-inspiring view of the mountain range.", "gt-answer": "A. moving away from the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the clouds are initially moving away from the camera and then later they are moving towards the camera.", "chatgpt-answer": "C. moving towards the camera", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with clouds moving away from the camera. The camera then pans to the right, revealing a stunning view of the mountain range with clouds moving towards the camera. The video captures the beauty of nature and the majesty of the mountains.", "gt-answer": "A. moving away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the clouds are first moving away from the camera and then moving towards it, creating a visual effect.", "chatgpt-answer": "C. moving towards the camera", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with clouds moving away from the camera. The clouds then move towards the camera, creating a mesmerizing visual effect. The video captures the beauty of nature and the power of the mountains.", "gt-answer": "A. moving away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the clouds in the sky move in different directions. It does not specify whether the clouds are moving away or towards the camera. Therefore, we cannot determine the exact movement of the clouds based on the provided information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a breathtaking view of snow-covered mountains with a blue sky in the background. The camera pans around the mountains, capturing the beauty of the landscape. The clouds in the sky move in different directions, adding to the visual appeal of the video. The serene and picturesque scenery is sure to leave the viewer in awe.", "gt-answer": "A. moving away from the camera", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video starts with a dark sky and bright stars, indicating that it is nighttime. However, towards the end of the video, it shows the sun rising over the mountains, casting a warm glow over the landscape. This suggests that the video is transitioning from night to day and getting brighter.", "chatgpt-answer": "C. getting brighter", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with a starry sky above. The camera pans around the mountains, capturing the beauty of the snow-covered peaks and the vastness of the landscape. The sky is dark, but the stars are bright and twinkling, creating a serene and peaceful atmosphere. The video ends with a shot of the sun rising over the mountains, casting a warm glow over the snowy landscape.", "gt-answer": "C. getting brighter", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sky is dark and the stars are visible throughout the video. There is no mention of any changes in lighting or brightness. Therefore, the correct answer is A. staying the same.", "chatgpt-answer": "A. staying the same", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with a starry sky above. The camera pans around the mountain range, capturing the beauty of the snow-covered peaks and the vastness of the mountain range. The sky is dark, and the stars are visible, creating a serene and peaceful atmosphere. The video ends with a shot of the mountain range at night, with the stars shining brightly against the dark sky.", "gt-answer": "C. getting brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video ends with a shot of the sun setting on the mountains. Therefore, the lighting in the video is getting darker as the sun sets.", "chatgpt-answer": "B. getting darker", "video-llm-prediction": "The video showcases a beautiful mountain range with snow-covered peaks and a clear blue sky. The camera pans across the mountains, capturing the stunning scenery. The video ends with a shot of the sun setting on the mountains.", "gt-answer": "C. getting brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that \"the clouds get darker and brighter.\" This indicates that the brightness of the video is changing.", "chatgpt-answer": "C. getting brighter", "video-llm-prediction": "The video showcases a breathtaking view of a snowy mountain range with a blue sky and a few clouds. The camera pans around the mountain range, and the clouds get darker and brighter. The video captures the beauty of nature and the tranquility of the mountain range.", "gt-answer": "C. getting brighter", "rating": 1 } ] }, "1082419672_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the ship is seen moving in the water and the video ends with the ship sailing away from the camera. This indicates that the ship is moving forwards.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "The video shows a large cruise ship sailing on the ocean. The camera captures the ship from different angles, including from the front and from behind. The ship is seen moving in the water, and the camera captures the ship from different angles. The video also shows the ship from the side, with the camera capturing the ship from a distance. The video ends with the ship sailing away from the camera.", "gt-answer": "B. flying forwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the cruise ship is sailing on the ocean. Based on this information, it can be inferred that the ship is moving forwards in the water.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "The video showcases a large cruise ship sailing on the ocean, with a lighthouse visible in the background. The camera captures the ship from different angles, highlighting its size and grandeur. The ship's movement is smooth and steady, and the water around it is calm and clear. The lighthouse serves as a navigational aid for ships, guiding them safely through the waters. The video provides a serene and picturesque view of the ocean and the ship, making it an ideal watch for anyone looking to escape the hustle and bustle of everyday life.", "gt-answer": "B. flying forwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ship is seen moving in the water, which implies a forward movement.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "The video shows a large cruise ship sailing on the ocean. The camera captures the ship from different angles, including from the front and side. The ship is seen moving in the water, and the camera captures the ship from a distance. The video also shows the ship from a close-up perspective, highlighting its size and grandeur. The ship's design and features are also visible in the video. Overall, the video provides a comprehensive view of the cruise ship and its surroundings.", "gt-answer": "B. flying forwards", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the cruise ship is sailing on the ocean, which implies a forward movement. There is no mention of the bird flying in the opposite direction or hovering in the video description.", "chatgpt-answer": "B. flying forwards", "video-llm-prediction": "The video showcases a large cruise ship sailing on the ocean, with a lighthouse visible in the background. The camera captures the ship from different angles, highlighting its impressive size and design. The video also features a bird flying over the water, adding a touch of nature to the scene. Overall, the video provides a stunning view of the cruise ship and its surroundings, making it an excellent visual experience for viewers.", "gt-answer": "B. flying forwards", "rating": 1 } ] }, "1058985719_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the airplane is seen from below, indicating that the airplane is flying from top to bottom.", "chatgpt-answer": "C. top to bottom", "video-llm-prediction": "A large airplane is seen flying through the sky, with the sun shining through the clouds. The plane is seen from below, and the sun is shining through the clouds.", "gt-answer": "C. top to bottom", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the plane is seen from below, which means the camera is looking up at the airplane. Therefore, the airplane is flying from top to bottom.", "chatgpt-answer": "C. top to bottom", "video-llm-prediction": "The video showcases a large airplane flying through the sky, with the sun shining through the clouds. The plane is seen from below, and the sun is shining through the clouds. The video captures the beauty of the sky and the plane's journey through it.", "gt-answer": "C. top to bottom", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the plane is seen from below, which indicates that the plane is flying from top to bottom.", "chatgpt-answer": "C. top to bottom", "video-llm-prediction": "A plane flies through the sky, with the sun shining through the clouds. The plane is seen from below, and the sun is shining through the clouds. The plane is seen from below, and the sun is shining through the clouds. The plane is seen from below, and the sun is shining through the clouds.", "gt-answer": "C. top to bottom", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the plane is flying through the sky, soaring high above the clouds. Since there is no mention of the plane's movement in a specific direction (e.g., ascending or descending), we can assume it is flying horizontally. Additionally, there is no information provided regarding the plane moving from one side to another, so we cannot determine whether it is flying right to left or left to right.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A plane flies through the sky, soaring high above the clouds. The sun shines brightly in the background, casting a warm glow on the scene. The plane's wings are spread wide, and its shadow can be seen on the clouds below. The sound of the engine is audible, and the wind rushes past the plane as it continues on its journey.", "gt-answer": "C. top to bottom", "rating": 0 } ] }, "1055413730_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the Earth is spinning in space. According to our conventional understanding, when referring to the rotation of the Earth, the direction is usually described as from west to east, or counterclockwise when viewed from above the North Pole. Therefore, the correct answer would be leftwards.", "chatgpt-answer": "C. Leftwards", "video-llm-prediction": "The video shows a close-up of the Earth spinning in space. The camera captures the rotation of the Earth from different angles, providing a comprehensive view of the planet's movement. The video emphasizes the beauty and complexity of our planet, highlighting the Earth's rotation and the vastness of space.", "gt-answer": "C. Leftwards", "rating": 1 }, { "chatgpt-reasoning": "The video mentions that the camera captures the movement of the Earth's surface as it rotates. Since the Earth rotates from west to east, the direction of rotation can be described as leftwards when viewed from above the North Pole.", "chatgpt-answer": "C. Leftwards", "video-llm-prediction": "The video showcases the beauty and complexity of our planet, Earth. The camera captures the vibrant colors of the Earth's surface, highlighting the contrast between the blue oceans and the brown land masses. The video also emphasizes the Earth's rotation, with the camera capturing the movement of the Earth's surface as it rotates. The video concludes with a stunning view of the Earth from space, showcasing the planet's beauty and the vastness of the universe.", "gt-answer": "C. Leftwards", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the globe is spinning in different directions, including upwards, downwards, leftwards, and rightwards. However, it does not provide any specific reference to the direction of the Earth's rotation.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A video of a spinning globe is shown, with the words \"Earth\" and \"Planet\" appearing on the screen. The video then shows the globe spinning in different directions, including upwards, downwards, leftwards, and rightwards.", "gt-answer": "C. Leftwards", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the direction in which the planet Earth is spinning. Spinning is not mentioned in the description, so it is not possible to determine the correct answer.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a breathtaking view of the Earth from space, with the camera capturing the beauty of our planet from various angles. The video begins with a close-up shot of the Earth, followed by a panoramic view of the entire planet. The camera then zooms out to show the Earth from a distance, with the sun shining brightly in the background. The video captures the Earth's vibrant colors and the vastness of our planet. The camera then zooms in to show the Earth's surface, with the oceans, continents, and cities visible.", "gt-answer": "C. Leftwards", "rating": 0 } ] }, "1081684532_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that some of the asteroids are flying towards the camera.", "chatgpt-answer": "C. flying towards the camera", "video-llm-prediction": "The video showcases a group of asteroids flying away from the camera, with some of them flying towards the camera. The video captures the movement of the asteroids in the dark space, creating a mesmerizing visual experience. The sound of the asteroids colliding with each other can be heard, adding to the immersive experience. The video is a perfect representation of the beauty and power of the universe.", "gt-answer": "A. flying away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the asteroids are \"flying away from the camera\" and \"some of them flying to the left.\" This means that the asteroids are moving in two different directions - away from the camera and to the left.", "chatgpt-answer": "A. flying away from the camera and B. flying to the left", "video-llm-prediction": "The video showcases a group of asteroids flying away from the camera, with some of them flying to the left and others flying towards the camera. The video captures the beauty and movement of the asteroids as they soar through space.", "gt-answer": "A. flying away from the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera starts with a close-up shot of a large rock and then transitions to a wider shot of several asteroids flying away from the camera. It also mentions that the camera focuses on a single asteroid flying towards the camera and the video ends with the asteroid flying away from the camera. Based on this information, we can infer that the direction of the asteroids in the video is \"flying away from the camera\".", "chatgpt-answer": "A. flying away from the camera", "video-llm-prediction": "A video showcasing the movement of asteroids in space. The video starts with a close-up shot of a large rock, and then transitions to a wider shot of several asteroids flying away from the camera. The camera then focuses on a single asteroid flying towards the camera, and the video ends with the asteroid flying away from the camera.", "gt-answer": "A. flying away from the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the asteroids are \"flying away from the camera.\" Therefore, option A. flying away from the camera is the correct answer.", "chatgpt-answer": "A. flying away from the camera", "video-llm-prediction": "The video showcases a group of asteroids flying away from the camera, with some of them flying to the left and others flying towards the camera. The video captures the beauty and movement of the asteroids as they soar through space.", "gt-answer": "A. flying away from the camera", "rating": 1 } ] }, "23391142_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the video captures the players' movements as they run around the court, indicating that the camera is most likely following their movements. Therefore, the direction of panning should be in the same direction as the players' movements.", "chatgpt-answer": "D. To the right", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The video captures the players' movements as they run around the court, trying to keep up with the shuttlecock. The players are seen hitting the shuttlecock with their rackets, and the shuttlecock is seen flying through the air. The video also shows the players' expressions as they play the game. Overall, the video captures the excitement and energy of the game of badminton.", "gt-answer": "C. To the left", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the direction of the panning. Since there is no information provided, we cannot determine the correct answer.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The game continues with the players hitting the shuttlecock with their rackets. The players are seen running around the court to keep up with the shuttlecock. The game continues with the players hitting the shuttlecock with their rackets. The players are seen running around the court to keep up with the shuttlecock. The game continues with the players hitting the shuttlecock with their rackets. The players are seen running around the court", "gt-answer": "C. To the left", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the direction in which the video is panning. We cannot determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a game of tennis being played by four people on a court. The players are seen hitting the ball back and forth to each other while the camera captures their movements. The video ends with the players walking away from the court.", "gt-answer": "C. To the left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video captures the players' movements as they move around the court, indicating that the camera is following their movements. It does not mention any specific direction of panning.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of people playing badminton in a gymnasium. The players are seen hitting the shuttlecock back and forth over the net. The video captures the players' movements as they move around the court, trying to outmaneuver their opponents. The players' skills are evident as they hit the shuttlecock with precision and speed. The gymnasium provides a spacious area for the players to move around freely. The video is a great representation of the game of badminton and the skills required to play it.", "gt-answer": "C. To the left", "rating": 0 } ] }, "1053758117_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera starts with a zoom out from a 3D digital brain, then zooms in on the brain, and finally zooms out again. This indicates that what is happening in the video is a sequence of zooming in and out of a 3D digital brain.", "chatgpt-answer": "C. Zoom into a 3D digital brain", "video-llm-prediction": "The video starts with a zoom out from a 3D digital brain, which is the main focus of the video. The camera then zooms in on the brain, providing a closer look at its intricate structure. The video then zooms out again, giving a broader perspective of the brain. The video ends with a zoom out from the entire video. The video showcases the beauty and complexity of the human brain, providing a fascinating glimpse into its inner workings.", "gt-answer": "A. Zoom out from a 3D digital brain", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with a zoom out from a 3D digital brain, which is then followed by a zoom in on the same brain. Therefore, the correct answer is A. Zoom out from a 3D digital brain.", "chatgpt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "The video starts with a zoom out from a 3D digital brain, which is then followed by a zoom in on the same brain. The video then shows a zoom out from a 3D digital brain, which is followed by a zoom in on the same brain. The video then shows a zoom out from a 3D digital brain, which is then followed by a zoom in on the same brain. The video then shows a zoom out from a 3D digital brain, which is then followed by a zoom in on the same brain. The video then shows a zoom out from a 3D digital brain, which is", "gt-answer": "A. Zoom out from a 3D digital brain", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with a zoom out from a 3D digital brain, then zooms in to show a close-up of the brain, and finally ends with a zoom out from the entire brain.", "chatgpt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "The video starts with a zoom out from a 3D digital brain, and then zooms in to show a close-up of the brain. The video then zooms out again, showing the entire brain. The video ends with a zoom out from the entire brain.", "gt-answer": "A. Zoom out from a 3D digital brain", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the video showcases a 3D digital brain zooming in and out, with a focus on the brain's intricate structure. It specifically mentions a zoom out from a 3D digital brain, zooming in to reveal the brain's network, and then zooming out again.", "chatgpt-answer": "A. Zoom out from a 3D digital brain", "video-llm-prediction": "The video showcases a 3D digital brain zooming in and out, with a focus on the brain's intricate structure. The video begins with a zoom out from a 3D digital brain, providing a comprehensive view of the brain's complexity. The camera then zooms in, revealing the brain's intricate network of neurons and blood vessels. The video then zooms out again, providing a broader perspective of the brain's structure. Overall, the video highlights the brain's remarkable complexity and the importance of understanding its structure to better understand its function.", "gt-answer": "A. Zoom out from a 3D digital brain", "rating": 1 } ] }, "1106668103_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans out to show the entire coffee bean, indicating a movement away from the close-up shot. This suggests that the direction of movement in the video is moving backward.", "chatgpt-answer": "C. moving backward", "video-llm-prediction": "The video showcases a close-up of coffee beans, which are then shown being ground up. The camera then pans out to show the entire coffee bean. The video ends with a close-up of the coffee beans.", "gt-answer": "C. moving backward", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans out to show the entirety of the coffee beans, indicating a movement away from the close-up shot. This suggests that the direction of movement in the video is moving backward.", "chatgpt-answer": "C. moving backward", "video-llm-prediction": "The video showcases a close-up of coffee beans, which are then rotated to reveal their different sides. The camera then pans out to show the entirety of the coffee beans.", "gt-answer": "C. moving backward", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the beans, providing a detailed view of their unique features. This implies that there is movement in the video.", "chatgpt-answer": "B. moving forward", "video-llm-prediction": "The video showcases a close-up of coffee beans, with a focus on their texture and appearance. The camera pans around the beans, providing a detailed view of their unique features. The video also includes a shot of a person holding a cup of coffee, which adds a human element to the scene. The video ends with a shot of the coffee beans, emphasizing their importance in the coffee-making process.", "gt-answer": "C. moving backward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the coffee beans and the resulting coffee is poured into a cup. Both of these actions indicate movement in the video. \"Staying still\" is contradicted by the camera panning around the coffee beans, and \"moving forward\" is contradicted by the action of pouring coffee into a cup. Therefore, the correct answer is \"C. moving backward\", as it implies a reverse motion from the initial panning movement around the coffee beans.", "chatgpt-answer": "C. moving backward", "video-llm-prediction": "A close-up shot of coffee beans is shown, and the camera pans around them. The beans are then ground up, and the resulting coffee is poured into a cup. The video ends with the cup of coffee being enjoyed.", "gt-answer": "C. moving backward", "rating": 1 } ] }, "1057163434_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the chef starts by putting a burger patty on a bun, which implies that the bread is being used as a base for the burger. However, it also states that the video ends with the chef throwing the burger away. This suggests that the chef is likely removing the bread from the top of the burger.", "chatgpt-answer": "A. removing it from the top of the burger", "video-llm-prediction": "The video showcases a chef preparing a burger. The chef starts by putting a burger patty on a bun and then adds some vegetables. The chef then adds some sauce on top of the burger and puts it on a plate. The video ends with the chef throwing the burger away.", "gt-answer": "A. removing it from the top of the burger", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the chef is making a burger by putting toppings on it and ends with the chef throwing the burger away. Since the bread is mentioned in the description and the chef throws the burger away, it can be concluded that the chef is throwing the bread away.", "chatgpt-answer": "D. throwing it away", "video-llm-prediction": "A chef is shown making a burger by putting meat on a bun and adding various toppings. The video ends with the chef throwing the burger away.", "gt-answer": "A. removing it from the top of the burger", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef is making a burger by putting it together with various ingredients. Since the bread is an essential part of the burger, it is logical to assume that the chef is putting the bread on top of the burger.", "chatgpt-answer": "B. putting it on top of the burger", "video-llm-prediction": "A chef is shown making a burger by putting it together with various ingredients. He then takes a bite of the burger.", "gt-answer": "A. removing it from the top of the burger", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef is putting meat, cheese, and vegetables inside the bun, which implies that the bread is being used as a container for the burger ingredients.", "chatgpt-answer": "C. putting it inside the burger", "video-llm-prediction": "A chef is shown making a burger by putting meat, cheese, and vegetables inside the bun. He then puts the burger on a plate and throws the used vegetables away.", "gt-answer": "A. removing it from the top of the burger", "rating": 0 } ] }, "1100319395_reverse": { "direction": [ { "chatgpt-reasoning": "From the video description, it is mentioned that a white circle with a black dot is shown, then another white circle with a black dot moving towards the camera, and finally a white circle with a black dot moving away from the camera. There is no indication of any clockwise or counter-clockwise movement mentioned in the video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A white circle with a black dot in the center is shown, and then a white circle with a black dot moving towards the camera. The video then shows a white circle with a black dot moving away from the camera.", "gt-answer": "C. counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the circular pattern moves towards the camera first, then it moves away from the camera, and finally, it moves towards the camera again. This indicates that the circular pattern alternates between moving towards and away from the camera.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a circular pattern that moves towards the camera, followed by a pattern that moves away from the camera. The video then displays a circular pattern that moves towards the camera again. The video concludes with a circular pattern that moves away from the camera.", "gt-answer": "C. counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the white circle with a black dot is shown followed by a white circle with a black dot moving towards the camera and then a white circle with a black dot moving away from the camera. This indicates that the circular pattern is moving in the same direction as the dot, which is towards the camera and then away from the camera.", "chatgpt-answer": "B. moving towards the camera", "video-llm-prediction": "A white circle with a black dot in the center is shown, followed by a white circle with a black dot moving towards the camera. The video then shows a white circle with a black dot moving away from the camera.", "gt-answer": "C. counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the circular pattern starts with a white circle with a black dot in the center, followed by a white circle with a black dot moving towards the camera, and then a white circle with a black dot moving away from the camera. This sequence indicates that the circular pattern is rotating in a specific direction.", "chatgpt-answer": "A. clockwise", "video-llm-prediction": "A white circle with a black dot in the center is shown, followed by a white circle with a black dot moving towards the camera. The video then shows a white circle with a black dot moving away from the camera.", "gt-answer": "C. counter-clockwise", "rating": 0 } ] }, "1101200293_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans around the carrier, which indicates a rotational motion. It also mentions that the carrier is moving down the water, implying a forward motion. Therefore, the camera motion can be described as a combination of rotation and forward motion.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a large aircraft carrier with several fighter jets parked on it. The camera pans around the carrier, showing the jets parked in a straight line. The video then shows the carrier moving down the water, with the jets still parked in a straight line. The video ends with the carrier still moving down the water.", "gt-answer": "A. counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"the camera pans around the carrier\" and also mentions a transition to a scene capturing the movement of the carrier. This implies that the camera is moving in a circular motion around the carrier.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video showcases a large aircraft carrier with multiple fighter jets parked on its deck. The camera pans around the carrier, capturing the impressive size and structure of the vessel. The video then transitions to a scene where the carrier is sailing on the water, with the fighter jets still parked on its deck. The camera captures the movement of the carrier as it sails through the water, highlighting the power and grace of the vessel. The video concludes with a shot of the carrier sailing on the water, with the fighter jets still parked", "gt-answer": "A. counterclockwise", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the camera pans around the carrier, indicating a circular motion. However, the specific direction of the camera motion is not mentioned.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a large aircraft carrier with several fighter jets parked on it. The camera pans around the carrier, showing the jets parked in a line. The video then shows the carrier moving down a road, with the jets still parked in a line. The video ends with the carrier docked at a pier.", "gt-answer": "A. counterclockwise", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the camera pans around the carrier, showcasing its size and structure. It also transitions to different views of the carrier from below and above. This implies that the camera is moving in a circular motion around the aircraft carrier.", "chatgpt-answer": "A. counterclockwise", "video-llm-prediction": "The video showcases a large aircraft carrier with numerous fighter jets parked on its deck. The camera pans around the carrier, capturing the impressive size and structure of the vessel. The video then transitions to a view of the carrier from below, showcasing the sheer size of the aircraft carrier. The camera then pans around the deck of the carrier, highlighting the various fighter jets parked on the deck. The video concludes with a view of the carrier from above, showcasing the impressive size and structure of the vessel.", "gt-answer": "A. counterclockwise", "rating": 1 } ] }, "1072453637_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans to different angles of the fighter jet, including the back, downwards, upwards, and front.", "chatgpt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "The video showcases a fighter jet flying through the sky, with the camera capturing different angles of the jet. The video starts with the jet flying in the sky, and then the camera pans to the back of the jet. The camera then pans downwards around the jet, providing a unique perspective of the jet's movement. The video then pans upwards around the jet, offering a different angle of the jet's flight. Finally, the camera pans to the front of the jet, providing a clear view of the jet's nose. Overall, the video provides a comprehensive view of the", "gt-answer": "D. panning to the front of a fighter jet", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states the different directions of the camera panning, including panning to the back of the jet, downwards around the jet, upwards around the jet, and to the front of the jet.", "chatgpt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "A fighter jet is seen flying in the sky, with the camera panning to the back of the jet. The camera then pans downwards around the jet, showcasing its impressive maneuverability. The camera then pans upwards around the jet, highlighting its speed and agility. Finally, the camera pans to the front of the jet, providing a clear view of the cockpit and the pilot inside. The video captures the beauty and power of the fighter jet in action.", "gt-answer": "D. panning to the front of a fighter jet", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera is panning around the fighter jet. Since the different angles of the jet are shown, including from the front and back, it can be inferred that the camera is panning to the back of the fighter jet.", "chatgpt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "The video shows a fighter jet flying through the sky, with the camera panning around it. The jet is seen from different angles, including from the front and back. The sky is clear and blue, with no clouds or other objects visible. The sound of the jet's engine can be heard throughout the video.", "gt-answer": "D. panning to the front of a fighter jet", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans to different parts of the fighter jet, including the back, downwards, upwards, and the front.", "chatgpt-answer": "A. panning to the back of a fighter jet", "video-llm-prediction": "A fighter jet is seen flying in the sky, with the camera panning to the back of the jet. The camera then pans downwards around the jet, showcasing its impressive maneuverability. The camera then pans upwards around the jet, highlighting its speed and agility. Finally, the camera pans to the front of the jet, showcasing its powerful engine and advanced technology. Overall, the video captures the thrilling experience of flying in a fighter jet and the incredible capabilities of modern aviation technology.", "gt-answer": "D. panning to the front of a fighter jet", "rating": 0 } ] }, "3396473605_reverse": { "direction": [ { "chatgpt-reasoning": "There is no information in the video description about the stars disappearing or the direction in which they disappear.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows five stars arranged in a circle, with each star having a different color. The stars are arranged in a circular pattern, with the colors of the stars being blue, green, yellow, red, and purple. The video is a simple yet visually appealing display of the five stars.", "gt-answer": "A. from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the stars appear from right to left. Since the question is asking about the direction in which the stars disappear, we can infer that they will also disappear from right to left.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "The video features a five-star rating system, with the stars appearing from right to left. The video showcases various scenes, including a man standing in front of a building, a car driving down a road, and a person walking down a street. The video also includes a scene of a person sitting on a bench. The video concludes with a scene of a person standing in front of a building.", "gt-answer": "A. from right to left", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the five stars appear from right to left. If the stars are appearing from right to left, it can be inferred that they will disappear in the same direction.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "The video features a five-star rating system, with the stars appearing from right to left.", "gt-answer": "A. from right to left", "rating": 1 }, { "chatgpt-reasoning": "The video description doesn't provide explicit information about the direction in which the five stars disappear. Therefore, it is not possible to determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a five-star rating system, with the stars arranged in a circular pattern. The video begins with a blue screen displaying the five-star rating system, followed by a black screen with the same rating system. The video then shows a man using a computer, with the five-star rating system displayed on the screen. The video concludes with a black screen featuring the five-star rating system.", "gt-answer": "A. from right to left", "rating": 0 } ] }, "1086820415_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the large wave is moving vertically towards the top of the screen.", "chatgpt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "The video shows a large wave moving vertically towards the top of the screen. The wave is so large that it covers the entire screen. The wave is moving at a very fast pace and is creating a lot of white foam in its wake. The water is a deep blue color, and the sky is a clear blue. The video captures the power and beauty of the ocean, and it is a sight to behold.", "gt-answer": "A. moving vertically towards the top of the screen", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the large wave is moving vertically towards the top of the screen. It does not mention any horizontal motion or movement towards the bottom or left side of the screen.", "chatgpt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "The video showcases a large wave moving vertically towards the top of the screen, followed by a series of waves moving horizontally towards the right side of the screen. The waves continue to move towards the bottom of the screen, creating a mesmerizing visual experience.", "gt-answer": "A. moving vertically towards the top of the screen", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the large wave is moving vertically towards the top of the screen.", "chatgpt-answer": "A. moving vertically towards the top of the screen", "video-llm-prediction": "The video shows a large wave moving vertically towards the top of the screen.", "gt-answer": "A. moving vertically towards the top of the screen", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the large wave moves in different directions. It first moves vertically towards the top of the screen, then horizontally towards the right side, followed by vertically towards the bottom, and finally horizontally towards the left side.", "chatgpt-answer": "Option D. moving horizontally towards the left side of the screen.", "video-llm-prediction": "The video showcases a large wave moving vertically towards the top of the screen, followed by the wave moving horizontally towards the right side of the screen. The wave then moves vertically towards the bottom of the screen, and finally, it moves horizontally towards the left side of the screen.", "gt-answer": "A. moving vertically towards the top of the screen", "rating": 0 } ] }, "1073831006_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that some zebras are running from right to left, while others are running from left to right.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them running towards the water. The zebras are seen running in different directions, with some running from right to left, while others are running from left to right. The video captures the zebras in motion, with their distinct black and white stripes visible as they run through the field. The sound of their hooves pounding against the ground can be heard, adding to the immersive experience of the video. Overall, the video showcases the beauty and grace of these animals in their natural habitat.", "gt-answer": "A. from right to left", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the zebras are running in different directions, some towards the water and others away from it. However, there is no specific mention of the direction from top to bottom or vice versa.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them running towards the water. The zebras are seen running in different directions, with some running towards the water and others running away from it. The field is surrounded by tall grass, and the zebras are running with great speed. The water is calm, and the zebras are running with great enthusiasm. The video captures the beauty of the zebras and their natural habitat.", "gt-answer": "A. from right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the zebras are running from right to left.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "A group of zebras are seen running through a field of tall grass. They are running from right to left.", "gt-answer": "A. from right to left", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that some zebras are running from right to left, while others are running from left to right.", "chatgpt-answer": "A. from right to left", "video-llm-prediction": "A group of zebras are seen running through a field, with some of them running towards the water. The zebras are seen running in different directions, with some running from right to left, while others are running from left to right. The video captures the zebras in motion, with their distinct black and white stripes visible as they run. The field is vast and open, with the zebras running freely in the wild. The video provides a glimpse into the natural behavior of zebras in their natural habitat.", "gt-answer": "A. from right to left", "rating": 1 } ] }, "1024867412_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the dog is seen turning left and right while driving the car, and the video ends with the dog driving the car backward. Thus, the car is driving backward.", "chatgpt-answer": "D. Going backward", "video-llm-prediction": "A dog is seen driving a car in the video. The dog is wearing sunglasses and a collar. The car is seen driving on a road with other cars around it. The dog is seen turning left and right while driving the car. The video ends with the dog driving the car backward.", "gt-answer": "A. Taking a left turn", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the dog is seen taking a left turn, going straight, taking a right turn, and going backward while driving the car.", "chatgpt-answer": "D. Going backward", "video-llm-prediction": "A dog wearing sunglasses is seen driving a car on a road. The dog is seen taking a left turn, going straight, taking a right turn, and going backward. The video captures the dog's playful and adventurous spirit as it enjoys the ride.", "gt-answer": "A. Taking a left turn", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the dog is taking a left turn while driving the car.", "chatgpt-answer": "A. Taking a left turn", "video-llm-prediction": "A dog is seen driving a car and taking a left turn.", "gt-answer": "A. Taking a left turn", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the dog is driving a car and describes its movements, including taking a left turn, going straight, taking a right turn, and going backward.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A dog wearing sunglasses is seen driving a car on a street, taking a left turn, going straight, taking a right turn, and going backward.", "gt-answer": "A. Taking a left turn", "rating": 0 } ] }, "1076877854_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the robotic arms are seen moving around the field. Since it doesn't specify any specific direction, we cannot determine which direction the closest robotic arm is moving from the camera's point of view.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a group of robotic arms working in a field. The arms are seen moving around the field, and one of the arms is shown cutting the grass. The video also shows the arms moving around the field, and one of the arms is shown cutting the grass. The video ends with the arms moving around the field.", "gt-answer": "D. To the left side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the robots are moving around the field and planting seeds in a very precise manner. The question asks about the direction of the closest robotic arm from the camera's point of view. Since the video description does not provide any specific information about the movement direction, it is impossible to determine the correct answer.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a green field with several white robots that are planting seeds in the soil. The robots are seen moving around the field, and they are planting seeds in a very precise manner. The video also shows the robots moving around the field, and they are planting seeds in a very precise manner. The video is a great example of how technology can be used to make the world a better place.", "gt-answer": "D. To the left side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the robotic arm is moving towards the camera and away from it. Therefore, the closest robotic arm is moving towards the camera's point of view.", "chatgpt-answer": "B. Towards the camera", "video-llm-prediction": "A robotic arm is seen in a field of plants, moving around and tending to the plants. The arm is seen moving towards the camera and away from it, as well as towards the right side of the screen.", "gt-answer": "D. To the left side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the white robotic arm is seen moving around a green field. Since there is no mention of the camera's position in relation to the arm, we cannot determine its exact direction. However, based on the given choices, the closest robotic arm could be moving either towards or away from the camera.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A white robotic arm is seen moving around a green field, picking up a leaf and placing it on a scale. The arm then moves to another plant and repeats the process.", "gt-answer": "D. To the left side of the screen", "rating": 0 } ] }, "1100468035_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera starts with a zooming backward shot, then it pans to the left, then it zooms forward. It continues to pan to the right, and then pans to the left again.", "chatgpt-answer": "D. panning left", "video-llm-prediction": "The video starts with a zooming backward shot of a room, and then it pans to the left. The camera then zooms forward, and we see a door with a camera on it. The camera then pans to the right, and we see a door with a camera on it. The camera then pans to the left, and we see a door with a camera on it. The camera then pans to the right, and we see a door with a camera on it. The camera then pans to the left, and we see a door with a camera on it. The camera then pans to the", "gt-answer": "A. zooming backward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions the movement of the camera throughout the video, stating that it pans to the right, zooms backward, zooms forward, and pans to the left. Therefore, the correct answer is the direction that matches the given movements.", "chatgpt-answer": "C. tracking right", "video-llm-prediction": "The video showcases a large room with blue walls and white doors, where a person is seen walking in the room. The camera then pans to the right, revealing a long row of white doors. The video then zooms backward, providing a closer look at the details of the room. The camera then zooms forward, providing a broader view of the room. The video then pans to the left, revealing a long row of white doors. The video then zooms backward, providing a closer look at the details of the room. The camera then zooms forward, providing a broader view of the", "gt-answer": "A. zooming backward", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera starts with a zooming backward shot, then zooms forward to show the entire room, and finally zooms backward again to show the entire room.", "chatgpt-answer": "A. zooming backward", "video-llm-prediction": "The video starts with a zooming backward shot of a room, and then zooms forward to show the entire room. The camera then pans left to show the entire room. The video then zooms backward to show the entire room.", "gt-answer": "A. zooming backward", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans left and right, and zooms in and out of the room. So, the camera is panning left and right.", "chatgpt-answer": "D. panning left", "video-llm-prediction": "The video showcases a room with blue walls and a door, and a hallway with blue walls and doors. The camera pans left and right, and zooms in and out of the room.", "gt-answer": "A. zooming backward", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description states that the door is shown in various positions, including being closed and gradually opening. This indicates that the door is not remaining closed or closing, but rather gradually opening.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video showcases a door that gradually opens, revealing a room with a blue light. The door is shown in various positions, including being closed and gradually opening. The video also features a blue light that illuminates the room.", "gt-answer": "B. closing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white door gradually opens and then closes. This indicates that the door is in motion, specifically opening and closing.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video showcases a white door that gradually opens, revealing a blue-lit room with numerous white cabinets. The door then closes, and the video ends.", "gt-answer": "B. closing", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the door is gradually opening.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video shows a door gradually opening.", "gt-answer": "B. closing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the door gradually opens, so option C. gradually opening is the correct answer.", "chatgpt-answer": "C. gradually opening", "video-llm-prediction": "The video showcases a door that gradually opens, revealing a room with a blue light. The door then closes, and the video ends.", "gt-answer": "B. closing", "rating": 0 } ] }, "3411806181_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the person is charging his car battery using a portable charger. Since the person is connecting the charger to the car battery, it can be inferred that he is moving the charging gun towards the car in order to connect it.", "chatgpt-answer": "C. Towards the car", "video-llm-prediction": "A man is seen charging his car battery using a portable charger. He connects the charger to the car battery and then uses the charger to charge his phone.", "gt-answer": "A. Away from the car", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person moves the charger to a different location. Since the charger is connected to the car battery, the person is most likely moving the charging gun towards the car.", "chatgpt-answer": "C. Towards the car", "video-llm-prediction": "A man is seen charging his car battery using a portable charger. He connects the charger to his car and begins to charge the battery. The man then moves the charger to a different location and continues to charge the battery. He repeats this process a few times, ensuring that the battery is fully charged. The video emphasizes the importance of keeping your car battery charged and ready to go at all times.", "gt-answer": "A. Away from the car", "rating": 0 }, { "chatgpt-reasoning": "In the video description, it is mentioned that the person disconnects the charger and puts it in his pocket. Later on, he takes out the charger from his pocket and puts it in the trunk of the car. This indicates that the person is moving towards the car while carrying the charging gun.", "chatgpt-answer": "C. Towards the car", "video-llm-prediction": "A man is seen charging his car battery with a portable charger. He connects the charger to his car battery and starts charging it. After a while, he disconnects the charger and puts it in his pocket. He then walks towards the car and opens the trunk. He takes out the charger from his pocket and puts it in the trunk. He then closes the trunk and walks towards the camera.", "gt-answer": "A. Away from the car", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man moves the charger to a different location. Since he is charging his car battery, it can be inferred that he would move the charging gun towards the car to continue charging the battery.", "chatgpt-answer": "C. Towards the car", "video-llm-prediction": "A man is seen charging his car battery using a portable charger. He connects the charger to his car and begins to charge the battery. The man then moves the charger to a different location and continues to charge the battery.", "gt-answer": "A. Away from the car", "rating": 0 } ] }, "1073914229_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the first train is moving towards the camera and the second train is moving away from the camera. Therefore, the trains are moving in opposite directions.", "chatgpt-answer": "C. away from each other", "video-llm-prediction": "The video shows two trains moving in opposite directions on the same track. The first train is seen moving towards the camera, while the second train is moving away from the camera. The video captures the movement of the trains as they pass each other on the track.", "gt-answer": "C. away from each other", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the trains are \"traveling in opposite directions\", which means they are moving away from each other.", "chatgpt-answer": "C. away from each other", "video-llm-prediction": "The video showcases two trains traveling in opposite directions on parallel tracks, surrounded by lush green fields and trees. The serene landscape provides a picturesque backdrop for the trains as they pass each other. The video captures the beauty of nature and the marvel of human engineering.", "gt-answer": "C. away from each other", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the two trains are passing each other on the tracks. This implies that the trains are moving in opposite directions, which means they are moving away from each other.", "chatgpt-answer": "C. away from each other", "video-llm-prediction": "The video shows two trains traveling in the same direction, passing each other on the tracks. The scenery around the tracks is also visible, with trees and fields in the background.", "gt-answer": "C. away from each other", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the two trains are traveling in opposite directions on the same track. This means they are moving away from each other.", "chatgpt-answer": "C. away from each other", "video-llm-prediction": "The video showcases two trains traveling in opposite directions on the same track, with trees and fields in the background.", "gt-answer": "C. away from each other", "rating": 1 } ] }, "1093139559_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions three different camera motions: zooming in on three football players, panning left, and panning right. It also mentions that the video zooms out from the three football players. However, it does not mention any other camera motions. Therefore, the correct answer is D. Zooming out from three football players.", "chatgpt-answer": "D. Zooming out from three football players", "video-llm-prediction": "The video starts with a zooming in on three football players. The camera then pans left, showing the entire stadium. The camera then pans right, showing the entire stadium. The video then zooms out from the three football players. The stadium is filled with cheering fans, and the players are seen walking around the field. The video captures the excitement and energy of a live football game.", "gt-answer": "D. Zooming out from three football palyers", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention any specific camera motion such as zooming in or out. However, it does describe the men walking onto the field, playing soccer, and then walking off the field. Based on this information, it is reasonable to assume that the camera could be panning left or right to capture their movements.", "chatgpt-answer": "B. Panning left", "video-llm-prediction": "The video shows three men walking onto a field, and then they are seen playing soccer. The men are seen running around the field, passing the ball to each other, and trying to score a goal. The video captures the excitement and energy of the game, with the men's movements and expressions conveying their passion for the sport. The field is surrounded by a large crowd of fans, who cheer and clap as the men play. The video ends with the men walking off the field, presumably after the game has ended. Overall, the video provides a thrilling and engaging experience for viewers,", "gt-answer": "D. Zooming out from three football palyers", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, there is no mention of any zooming motion. However, it is mentioned that the players are seen walking towards the center of the field and the video captures the excitement and energy of the game with the players running up and down the field. This suggests that the camera is likely following the action and moving horizontally. Therefore, the correct answer is either B. Panning left or C. Panning right.", "chatgpt-answer": "B. Panning left or C. Panning right", "video-llm-prediction": "The video shows three football players walking onto a field, with a crowd cheering them on. The players are seen walking towards the center of the field, where they begin to play. The video captures the excitement and energy of the game, with the players running up and down the field, passing the ball to each other, and scoring goals. The crowd is seen cheering and clapping throughout the video, adding to the overall atmosphere of the game. The video ends with the players walking off the field, with the crowd still cheering and clapping.", "gt-answer": "D. Zooming out from three football palyers", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera zooms in on the three football players and then pans left and right, showing the entire field. This indicates that the type of camera motion in the video is a combination of zooming in and panning left and right.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Three football players are seen walking onto a field, and the camera zooms in on them. The camera then pans left and right, showing the entire field. The players are then seen walking off the field.", "gt-answer": "D. Zooming out from three football palyers", "rating": 0 } ], "attribute_change": [ { "chatgpt-reasoning": "The video description doesn't provide any explicit information about the light condition on the football players. It only mentions the actions of the men and the crowd cheering. Therefore, there is not enough information to answer the question.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows three men walking onto a field while the crowd cheers. The men are wearing red shirts and black shorts. The video then shows the men walking onto the field while the crowd cheers. The men are seen walking around the field while the crowd cheers. The video then shows the men walking off the field while the crowd cheers. The video ends with the men walking off the field.", "gt-answer": "B. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the three men are walking onto a field, with the crowd cheering them on. Then, the men are seen walking around the field, and the crowd continues to cheer them on. Finally, the video ends with the men walking off the field. The video description does not mention anything about the light condition on the football players. Therefore, there is not enough information to answer the question.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows three men walking onto a field, with the crowd cheering them on. The men are seen walking around the field, and the crowd continues to cheer them on. The video ends with the men walking off the field.", "gt-answer": "B. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the light condition on the football players is turning darker.", "chatgpt-answer": "B. turning darker", "video-llm-prediction": "The video shows three men walking onto a field while the crowd cheers. The men are wearing red shirts and black shorts. The light condition on the football players is turning darker.", "gt-answer": "B. turning darker", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention any changes in the light condition on the football players. It only describes their actions of walking onto the field, walking around the field, and walking down the stairs. There is no information provided to determine whether the light condition is staying the same, turning darker, or turning brighter.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows three men walking onto a field while the crowd cheers. The men are seen walking around the field, and the camera pans around the stadium. The men are then seen walking down the stairs.", "gt-answer": "B. turning darker", "rating": 0 } ] }, "1080591311_reverse": { "direction": [ { "chatgpt-reasoning": "The video description explicitly mentions that the jellyfish are moving towards the right, floating upwards, and sinking downwards.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "The video showcases a group of jellyfish swimming in the ocean. The jellyfish are seen moving towards the right, floating upwards, and sinking downwards. The video captures the beauty and grace of these creatures as they move through the water.", "gt-answer": "D. sinking downwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the jellyfish is moving towards the right, then floating upwards, and finally moving towards the left.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "The video showcases a mesmerizing display of colorful jellyfish swimming in the ocean. The camera captures the jellyfish as they move towards the right, float upwards, and then move towards the left. The video highlights the beauty and grace of these aquatic creatures, making it a captivating watch for anyone interested in marine life.", "gt-answer": "D. sinking downwards", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the jellyfish are moving towards the right.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "A group of jellyfish are seen swimming in the water. They are moving towards the right.", "gt-answer": "D. sinking downwards", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the jellyfish are moving towards the right, floating upwards, and sinking downwards.", "chatgpt-answer": "A. moving towards the right", "video-llm-prediction": "The video showcases a group of jellyfish swimming in the ocean. The camera captures the movement of the jellyfish as they move towards the right, float upwards, and sink downwards. The video provides a mesmerizing view of the jellyfish and their natural behavior in the ocean.", "gt-answer": "D. sinking downwards", "rating": 0 } ] }, "3411228673_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans upwards and downwards, capturing the city's skyline and the bustling activity below. This indicates that the movement in the video is either upwards among skyscraper buildings or downwards towards the ground.", "chatgpt-answer": "B. upwards among skyscraper buildings", "video-llm-prediction": "The video showcases a cityscape with tall buildings and a busy street. The camera pans upwards and downwards, capturing the city's skyline and the bustling activity below. The video also includes a shot of a street intersection, where cars and pedestrians are visible. The consistent information is the presence of tall buildings, which are a prominent feature of the cityscape.", "gt-answer": "C. downwards towards the ground", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans upwards and downwards, capturing the bustling activity of the city. This indicates that the movement in the video is either upwards or downwards.", "chatgpt-answer": "B. upwards among skyscraper buildings", "video-llm-prediction": "The video showcases a cityscape with skyscrapers and a busy street filled with traffic. The camera pans upwards and downwards, capturing the bustling activity of the city. The video also features a bird flying over the city, adding a touch of nature to the urban landscape.", "gt-answer": "C. downwards towards the ground", "rating": 0 }, { "chatgpt-reasoning": "From the video description, it is mentioned that the camera captures the city from various angles, including a sideways view along the buildings, an upwards view among the buildings, and a downwards view towards the ground. It indicates that the camera's movement direction changes throughout the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a cityscape with a focus on the skyscraper buildings. The camera captures the city from various angles, including a sideways view along the buildings and an upwards view among the buildings. The video also features a downwards view towards the ground.", "gt-answer": "C. downwards towards the ground", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans from side to side, capturing the entire scene. This indicates a horizontal movement along the skyscraper buildings.", "chatgpt-answer": "A. sideways along the skyscraper buildings", "video-llm-prediction": "The video showcases a cityscape with a focus on the skyscraper buildings. The camera pans from side to side, capturing the entire scene. The video also includes a shot of the city from above, showcasing the buildings from a higher perspective.", "gt-answer": "C. downwards towards the ground", "rating": 0 } ] }, "1093737353_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera is performing a series of motions. It pans to the right, pans to the left, tilts up, and zooms in.", "chatgpt-answer": "A. panning to the right", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, each containing a plant. The camera pans to the right, revealing the entire series of beakers. The camera then pans to the left, revealing the entire series of beakers. The camera then tilts up, revealing the entire series of beakers. Finally, the camera zooms in, revealing the entire series of beakers.", "gt-answer": "B. panning to the left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans to the right, then zooms in on the plant, and finally pans to the left. Therefore, the camera is performing panning motion to the right and to the left, as well as zooming in.", "chatgpt-answer": "A. panning to the right or B. panning to the left", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with a plant placed in one of them. The beakers are placed on a table, and the camera pans to the right, providing a closer look at the plant in the beaker. The video then zooms in on the plant, providing a detailed view of its features. The camera then pans to the left, showcasing the other beakers and the plant in the beaker. The video ends with the camera panning to the left, providing a final view of the beakers and the plant.", "gt-answer": "B. panning to the left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans to the right, showcasing the beakers in a row. Additionally, it states that the video ends with the camera panning to the left, showcasing the entire row of beakers. Therefore, the camera is performing a panning motion, first to the right and then to the left.", "chatgpt-answer": "A. panning to the right", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with a plant placed in one of them. The beakers are placed on a table, and the camera pans to the right, showcasing the beakers in a row. The video then zooms in on the plant in the beaker, providing a close-up view of the plant's details. The video ends with the camera panning to the left, showcasing the entire row of beakers.", "gt-answer": "B. panning to the left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera is panning to the right in the first part, and then it zooms in on the plant in the second part.", "chatgpt-answer": "D. zooming in", "video-llm-prediction": "The video showcases a series of beakers filled with green liquid, with a plant placed in one of them. The beakers are placed on a table, and the camera pans to the right, providing a closer look at the plant in the beaker. The video then zooms in on the plant, providing a detailed view of its features.", "gt-answer": "B. panning to the left", "rating": 0 } ] }, "1017768724_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the person is moving in an upward, leftward, downward, and rightward direction sequentially.", "chatgpt-answer": "A. moving upwards", "video-llm-prediction": "A person is seen holding a compass in a forest. The person is moving upwards and then moves leftwards. The person then moves downwards and finally moves rightwards.", "gt-answer": "B. moving leftwards", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is moving upwards.", "chatgpt-answer": "A. moving upwards", "video-llm-prediction": "A person is seen holding a compass in a forest. The person is moving upwards, and the compass is being held in the person's right hand. The person is also wearing a watch on their left hand.", "gt-answer": "B. moving leftwards", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is moving upwards, then leftwards, downwards, and finally rightwards.", "chatgpt-answer": "D. moving rightwards", "video-llm-prediction": "A person is seen holding a compass in a forest. The person is moving upwards and then moving leftwards. The person then moves downwards and finally moves rightwards.", "gt-answer": "B. moving leftwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is holding a compass and pointing it towards the camera. The person then moves the compass around while still pointing it towards the camera. Based on this information, we can infer that the person's movement would correspond to the movement of the compass needle in relation to the camera.", "chatgpt-answer": "D. moving rightwards", "video-llm-prediction": "A person is seen holding a compass and pointing it towards the camera. The person then moves the compass around while still pointing it towards the camera. The video seems to be a demonstration of how to use a compass.", "gt-answer": "B. moving leftwards", "rating": 0 } ] }, "1100117263_reverse": { "direction": [ { "chatgpt-reasoning": "The video description does not provide any information about the direction of the little lion's motion. It only states that the little lion jumps off the lioness and runs around the field. Without any further information, it is not possible to determine the exact direction of the little lion's motion.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a lioness and her cub in a grassy field. The lioness is seen eating grass while her cub climbs on her back. The cub then jumps off the lioness and runs around the field. The lioness is seen eating grass again while her cub climbs on her back. The cub then jumps off the lioness again and runs around the field.", "gt-answer": "B. upward", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the baby lion is seen climbing on top of its mother and playing with her. Climbing on top implies a motion from a lower position to a higher position.", "chatgpt-answer": "B. upward", "video-llm-prediction": "A baby lion is seen climbing on top of its mother while she is eating grass. The baby lion is seen playing with its mother and climbing on her back. The mother lion is seen eating grass while the baby lion is playing with her. The video captures the playful and affectionate interaction between the mother and baby lion.", "gt-answer": "B. upward", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the baby lion is climbing on top of an adult lion. Since the baby lion is climbing up onto the adult lion, its motion is upward.", "chatgpt-answer": "B. upward", "video-llm-prediction": "A baby lion climbs on top of an adult lion while they both graze in the grass.", "gt-answer": "B. upward", "rating": 1 }, { "chatgpt-reasoning": "The video describes that the baby lion climbs on top of its mother and then jumps off and walks away. Based on this information, we can infer that the motion of the little lion is upward when climbing on top of its mother and then either downward or towards the camera when jumping off and walking away.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A baby lion climbs on top of its mother while she eats grass. The baby lion then jumps off and walks away.", "gt-answer": "B. upward", "rating": 0 } ] }, "1021488277_reverse": { "direction": [ { "chatgpt-reasoning": "The video description clearly states that the sequence of events is as follows: dropping down the pineapple, pushing forward the pineapple, rotating the pineapple, and picking up the pineapple.", "chatgpt-answer": "A. A person drops down the pineapple, B. A person pushes forward the pineapple, C. A person rotates the pineapple, D. A person picks up the pineapple", "video-llm-prediction": "A person drops down the pineapple, and then a person pushes forward the pineapple. After that, a person rotates the pineapple, and finally, a person picks up the pineapple.", "gt-answer": "A. A person drops down the pineapple", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions a sequence of actions involving the pineapple - dropping it down, pushing it forward, rotating it, and picking it up.", "chatgpt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "A person drops down the pineapple, and then a person pushes forward the pineapple. After that, a person rotates the pineapple, and finally, a person picks up the pineapple.", "gt-answer": "A. A person drops down the pineapple", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that a person is dropping down the pineapple.", "chatgpt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "A person drops down the pineapple.", "gt-answer": "A. A person drops down the pineapple", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states the sequence of events: dropping down the pineapple, pushing forward the pineapple, rotating the pineapple, and picking up the pineapple.", "chatgpt-answer": "A. A person drops down the pineapple", "video-llm-prediction": "A person drops down the pineapple, and then pushes forward the pineapple. Next, a person rotates the pineapple, and finally, a person picks up the pineapple.", "gt-answer": "A. A person drops down the pineapple", "rating": 1 } ] }, "1100397435_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the vacuum cleaner is seen moving towards the left side of the screen and then towards the right side of the screen. It also states that the vacuum cleaner is seen moving towards the screen and then away from the screen.", "chatgpt-answer": "D. away from the screen", "video-llm-prediction": "A robot vacuum cleaner is seen in a room, moving around and cleaning the floor. The camera captures the movements of the vacuum cleaner as it moves around the room. The vacuum cleaner is seen moving towards the left side of the screen and then towards the right side of the screen. The camera captures the movements of the vacuum cleaner as it moves around the room. The vacuum cleaner is seen moving towards the screen and then away from the screen. The camera captures the movements of the vacuum cleaner as it moves around the room. The vacuum cleaner is seen moving", "gt-answer": "B. to the left side of the screen", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the robot vacuum cleaner is initially moving towards the left side of the screen, then towards the right side of the screen, and finally towards the screen. Therefore, the correct answer is B. to the left side of the screen.", "chatgpt-answer": "B. to the left side of the screen", "video-llm-prediction": "A robot vacuum cleaner is seen in a room, moving around the floor and cleaning up dirt. The camera captures the movements of the vacuum cleaner as it moves around the room. The vacuum cleaner is seen moving towards the left side of the screen, then towards the right side of the screen, and finally towards the screen. The video showcases the cleaning capabilities of the robot vacuum cleaner, highlighting its ability to move around the room and clean up dirt.", "gt-answer": "B. to the left side of the screen", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the robot vacuum cleaner is moving towards the left side of the screen.", "chatgpt-answer": "B. to the left side of the screen", "video-llm-prediction": "A robot vacuum cleaner is seen in a room, moving towards the left side of the screen.", "gt-answer": "B. to the left side of the screen", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the robot vacuum cleaner is moving towards the left side of the screen.", "chatgpt-answer": "B. to the left side of the screen", "video-llm-prediction": "A robot vacuum cleaner is seen in a room, moving towards the left side of the screen.", "gt-answer": "B. to the left side of the screen", "rating": 1 } ] }, "1108534143_reverse": { "direction": [ { "chatgpt-reasoning": "The video description states that the puppy is seen walking into a wigwam and then walking out of it. It also mentions that the video shows the puppy staying in the wigwam. This indicates that the puppy is performing all three actions mentioned - staying in a wigwam, walking into a wigwam, and walking out of a wigwam.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "A white puppy is seen walking into a wigwam and then walking out of it. The video shows the puppy staying in the wigwam.", "gt-answer": "B. walking into a wigwam", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the puppy is seen walking into a wigwam and then walking out of it.", "chatgpt-answer": "B. walking into a wigwam", "video-llm-prediction": "A white puppy is seen walking into a wigwam and then walking out of it. The puppy is seen sitting in the wigwam and then walking out of it.", "gt-answer": "B. walking into a wigwam", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the puppy is seen walking into a wigwam and then walking out of it.", "chatgpt-answer": "C. walking out of a wigwam", "video-llm-prediction": "A white puppy is seen walking into a wigwam and then walking out of it.", "gt-answer": "B. walking into a wigwam", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the puppy is seen walking into a wigwam and then walking out of it.", "chatgpt-answer": "C. walking out of a wigwam", "video-llm-prediction": "A white puppy is seen walking into a wigwam and then walking out of it. The video captures the playful and curious nature of puppies as they explore their surroundings. The wigwam provides a cozy and safe space for the puppy to play and rest. The video is a heartwarming reminder of the joy and innocence of puppies and the love they bring into our lives.", "gt-answer": "B. walking into a wigwam", "rating": 0 } ] }, "1047368344_reverse": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the girl is running and jumping into the water, swimming in the water, and jumping out of it.", "chatgpt-answer": "A. jumping into water", "video-llm-prediction": "A girl is seen running and jumping into the water while wearing a yellow dress. She then swims in the water and jumps out of it.", "gt-answer": "D. jumping out of water", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girl is seen walking on a dock and then jumping into the water. It also states that she swims in the water and then jumps out of it. So, the girl is jumping into water, swimming in it, and then jumping out of it.", "chatgpt-answer": "A. jumping into water", "video-llm-prediction": "A girl in a yellow dress is seen walking on a dock and then jumping into the water. She swims in the water and then jumps out of it.", "gt-answer": "D. jumping out of water", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girl is seen running and jumping into the water, swimming in the water, and then jumping out of it. This indicates that the girl is performing multiple actions including jumping into the water, swimming in the water, and jumping out of it.", "chatgpt-answer": "A. jumping into water", "video-llm-prediction": "A girl in a yellow dress is seen running and jumping into the water. She then swims in the water and jumps out of it.", "gt-answer": "D. jumping out of water", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the girl is seen walking on a dock and then jumping into the water. This indicates that the girl is indeed jumping into the water.", "chatgpt-answer": "A. jumping into water", "video-llm-prediction": "A girl in a yellow dress is seen walking on a dock and then jumping into the water.", "gt-answer": "D. jumping out of water", "rating": 0 } ] }, "1050618460_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly mentions that the flowers are going through a process of turning into a full bloom.", "chatgpt-answer": "C. turning into full bloom", "video-llm-prediction": "The video showcases the process of a flower bud turning into a full bloom. The video starts with a close-up shot of a flower bud, which then transitions into a full bloom. The video then shows the flower bud turning into a full bloom, highlighting the transformation process. The video ends with a close-up shot of the flower bud, emphasizing the beginning of the process.", "gt-answer": "A. turning into buds", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the flowers go through the process of opening up, turning into full bloom, and then wilting and shrinking. Therefore, the correct answer is B. shrinking and wilting.", "chatgpt-answer": "B. shrinking and wilting", "video-llm-prediction": "The video showcases the process of a flower bud turning into a full bloom. The camera captures the buds as they begin to open up and reveal their true beauty. The video also highlights the process of the flowers wilting and shrinking, emphasizing the impermanence of all things.", "gt-answer": "A. turning into buds", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the flowers are turning into full bloom. It mentions the process of a flower bud transitioning to a full bloom flower.", "chatgpt-answer": "C. turning into full bloom", "video-llm-prediction": "The video showcases the process of flowers turning into full bloom. The video starts with a close-up shot of a flower bud, which then transitions to a full bloom flower. The video then shows the flower bud turning into a full bloom flower. The video ends with a close-up shot of the flower bud, which is now a full bloom flower.", "gt-answer": "A. turning into buds", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the flower buds are turning into full bloom flowers.", "chatgpt-answer": "C. turning into full bloom", "video-llm-prediction": "The video showcases the process of a flower bud turning into a full bloom. The video starts with a close-up shot of a flower bud, which then transitions to a full bloom flower. The video then shows the flower bud turning into a full bloom flower, highlighting the transformation process. The video ends with a close-up shot of the flower, emphasizing its beauty.", "gt-answer": "A. turning into buds", "rating": 0 } ] }, "1083113449_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the sky is getting darker. This indicates a change in the sky's appearance from a lighter color to a darker color.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The video shows a city skyline at night with a blue sky. The sky is getting darker, and the lights in the buildings are on. The video also shows a building with a blue light on it.", "gt-answer": "A. lightening up", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the sky is seen getting darker.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The video showcases a tall building with a large window, which is lit up at night. The building is surrounded by other buildings, and the sky is seen getting darker.", "gt-answer": "A. lightening up", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the sky is getting darker. This indicates that there is a change in the sky's appearance and it is becoming less bright.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The video shows a building at night with its lights on, and the sky is getting darker.", "gt-answer": "A. lightening up", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the \"sky gradually getting darker.\" Therefore, the correct answer is C. getting darker.", "chatgpt-answer": "C. getting darker", "video-llm-prediction": "The video showcases a city skyline at night, with the sky gradually getting darker. The city lights up the night sky, creating a beautiful and mesmerizing view. The video captures the city's beauty and the changing colors of the sky, making it a perfect representation of the city's nightlife.", "gt-answer": "A. lightening up", "rating": 0 } ] }, "1091143117_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly mentions that the eye is initially closed and then opens. This indicates a transition from closed to open.", "chatgpt-answer": "A. from closed to open", "video-llm-prediction": "The video shows a person's eye, which is initially closed and then opens to reveal the inside of the eye.", "gt-answer": "D. from open to closed", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the eye is initially closed and then opens to reveal the inside of the eye.", "chatgpt-answer": "A. from closed to open", "video-llm-prediction": "The video showcases a close-up of a person's eye, which is initially closed and then opens to reveal the inside of the eye. The video highlights the intricate details of the eye, including the eyelashes, eyebrow, and the pupil. The video also emphasizes the importance of eye health and hygiene, as it shows the eye being cleaned with a tissue. The video is a great resource for anyone interested in learning more about the eye and its functions.", "gt-answer": "D. from open to closed", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person's eye is initially closed and then opens, revealing the inside of the eye. This indicates a transition from closed to open.", "chatgpt-answer": "A. from closed to open", "video-llm-prediction": "The video shows a close-up of a person's eye, which is initially closed and then opens to reveal the inside of the eye.", "gt-answer": "D. from open to closed", "rating": 0 }, { "chatgpt-reasoning": "The video description suggests that the person is inserting a contact lens into their eye. This implies that the eye starts from being open, then the contact lens is inserted, and ends with the contact lens in the person's eye, indicating that the eye remains open.", "chatgpt-answer": "A. from closed to open", "video-llm-prediction": "The video showcases the process of inserting contact lenses. It starts with a close-up shot of a contact lens, followed by a person's eye. The person then inserts the contact lens into their eye, and the video ends with a close-up shot of the contact lens in the person's eye.", "gt-answer": "D. from open to closed", "rating": 0 } ] }, "1098153561_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly mentions that the leaves are changing colors from green to red, indicating a seasonal change.", "chatgpt-answer": "C. changing color from green to red", "video-llm-prediction": "The video showcases a serene forest with trees adorned in vibrant red and yellow leaves. The camera pans around the forest, capturing the beauty of the changing leaves. The video also includes a shot of a person walking through the forest, adding a sense of tranquility to the scene.", "gt-answer": "D. changing color from red to green", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the leaves are changing color from green to red and then back to green again.", "chatgpt-answer": "C. changing color from green to red", "video-llm-prediction": "The video showcases the beauty of nature as it captures the vibrant colors of leaves changing from green to red and then back to green again. The camera pans around the forest, highlighting the vibrant colors of the leaves. The video also captures the changing shape of the leaves, from flat to curled up. The serene and peaceful atmosphere of the forest is also highlighted, with the sounds of birds chirping and leaves rustling in the background. Overall, the video is a beautiful representation of the changing seasons and the beauty of nature.", "gt-answer": "D. changing color from red to green", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera captures the changing colors of the leaves. It starts with yellowing leaves and ends with green leaves, indicating a change in color from yellow to green.", "chatgpt-answer": "D. changing color from red to green", "video-llm-prediction": "The video showcases a serene forest with yellowing leaves, and the camera captures the changing colors of the leaves. The video starts with a shot of a forest with yellowing leaves, and the camera pans around the forest, capturing the changing colors of the leaves. The video ends with a shot of the forest with green leaves.", "gt-answer": "D. changing color from red to green", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the leaves are changing shape and falling off.", "chatgpt-answer": "A. changing shape and B. falling off", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves that are changing shape and falling off. The camera captures the beauty of the forest as it pans around, highlighting the changing colors of the leaves. The video provides a peaceful and calming experience for the viewer.", "gt-answer": "D. changing color from red to green", "rating": 0 } ] }, "1059072773_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the ice cream goes through multiple stages, including melting, freezing, evaporating, and solidifying.", "chatgpt-answer": "A. melting, B. freezing, C. evaporating, D. solidifying", "video-llm-prediction": "The video showcases the process of ice cream melting, freezing, evaporating, and solidifying. The video starts with a close-up shot of ice cream, which then transitions to a shot of the ice cream melting. The camera then shows the ice cream freezing, followed by a shot of the ice cream evaporating. Finally, the video ends with a shot of the ice cream solidifying.", "gt-answer": "D. solidifying", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions the different stages of ice cream, including melting, freezing, and solidifying. This suggests that the ice cream is undergoing these processes.", "chatgpt-answer": "A. melting", "video-llm-prediction": "The video showcases the process of ice cream melting, freezing, evaporating, and solidifying. The video starts with a close-up shot of ice cream, which then transitions to a shot of the ice cream melting. The camera then pans out to show the ice cream freezing, and the process repeats. The video ends with a shot of the ice cream solidifying. The video highlights the different stages of ice cream, from its melting to freezing and solidifying. The video is a great visual representation of the process of ice cream and how it", "gt-answer": "D. solidifying", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the ice cream is melting, which is supported by the observation of it melting in a circular motion and the liquid dripping off the surface. The video also states that the ice cream gradually solidifies, which indicates that it is transitioning from a solid to a liquid state.", "chatgpt-answer": "A. melting", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is shown melting in a circular motion, with the liquid dripping off the surface. The video emphasizes the process of melting and evaporating, with the ice cream gradually solidifying.", "gt-answer": "D. solidifying", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the ice cream goes through different stages, including melting, freezing, evaporating, and solidifying. Therefore, all four options are correct in this case.", "chatgpt-answer": "A. melting, B. freezing, C. evaporating, D. solidifying", "video-llm-prediction": "A video showcases the process of ice cream melting, freezing, evaporating, and solidifying. The video features a close-up shot of ice cream melting on a pink background, followed by a shot of ice cream freezing on a pink background. The video then transitions to a shot of ice cream evaporating on a pink background, and finally, a shot of ice cream solidifying on a pink background. The video highlights the different stages of ice cream, from melting to solidifying.", "gt-answer": "D. solidifying", "rating": 0 } ] }, "1093573255_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the plant is wilting initially, but then it revives and sheds leaves. Finally, it turns into buds. Therefore, all of the choices are correct because they all describe different stages of the plant's transformation.", "chatgpt-answer": "A. wilting, B. reviving, C. shedding leaves, D. turning into buds", "video-llm-prediction": "The video shows a plant in a white pot that is wilting. However, the plant is then shown reviving and shedding leaves. The plant is then shown turning into buds.", "gt-answer": "A. wilting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the plant is initially wilted and then revives, shedding leaves and turning into buds. This indicates that the plant is going through a process of wilting, reviving, shedding leaves, and turning into buds.", "chatgpt-answer": "All of the above options are correct", "video-llm-prediction": "The video showcases a plant that is initially wilted and then revives, shedding leaves and turning into buds.", "gt-answer": "A. wilting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the plant is wilting initially, then it starts to revive and shed its leaves. Finally, the plant turns into buds.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "A plant is shown in a white pot, and it is wilting. However, it starts to revive and shed its leaves. The plant then turns into buds.", "gt-answer": "A. wilting", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the plant is wilting, reviving, shedding its leaves, and turning into buds.", "chatgpt-answer": "A. wilting, B. reviving, C. shedding leaves, D. turning into buds", "video-llm-prediction": "A plant is seen in a white pot, with its leaves turning into buds. The plant is wilting, but then it starts to revive. The plant is shedding its leaves, but it is turning into buds.", "gt-answer": "A. wilting", "rating": 0 } ] }, "1077146132_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the woman is opening and closing the curtains. Opening the curtains would let more light into the room, while closing the curtains would block out the light. Therefore, the video is likely turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "A woman is seen standing in front of a window, opening and closing the curtains. She then lays down on the bed and continues to open and close the curtains.", "gt-answer": "B. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is opening the curtains and letting the sunlight in. This implies that more light is entering the room, which would result in the scene turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "A woman is seen standing in front of a window, opening the curtains and letting the sunlight in. She then lays down on the bed and closes her eyes, enjoying the warmth of the sun.", "gt-answer": "B. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is opening the curtains and letting the sunlight in. This suggests that the video is turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "A woman is seen standing in front of a window, opening the curtains and letting the sunlight in. She then lays down on the bed and closes her eyes.", "gt-answer": "B. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is opening the curtains and letting the sunlight in. This implies that the brightness in the room is increasing, so the answer should be C. turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "A woman is seen standing in front of a window, opening the curtains and letting the sunlight in. She then lays down on the bed and closes her eyes, enjoying the warmth of the sun.", "gt-answer": "B. turning darker", "rating": 0 } ] }, "1086688682_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the traffic light changes from red to green and then back to red again.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "The video shows a traffic light that changes from red to green, and then back to red again. The video also includes a shot of a building with a traffic light in front of it.", "gt-answer": "D. From green to red", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the traffic light changes from red to green and then back to red again.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "The video showcases a traffic light that changes from red to green, and then back to red again. The camera captures the light from different angles, highlighting its movement and color changes. The video emphasizes the importance of obeying traffic signals and the consequences of not doing so.", "gt-answer": "D. From green to red", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the change happening to the traffic lights is from red to green.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "A traffic light is shown in the video, and it changes from red to green.", "gt-answer": "D. From green to red", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the traffic light changes from red to green.", "chatgpt-answer": "A. From red to green", "video-llm-prediction": "A traffic light is shown in the video, and it changes from red to green.", "gt-answer": "D. From green to red", "rating": 0 } ] }, "1099738787_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the concrete wall is melting and falling apart, as well as being assembled together.", "chatgpt-answer": "B. falling apart", "video-llm-prediction": "The video shows a concrete wall that is melting and falling apart. The wall is shown in different stages of disintegration, with pieces of concrete falling off and the wall crumbling. The video also shows the wall being assembled together, with the pieces of concrete being put back into place. The video provides a detailed look at the process of the wall's disintegration and reassembly.", "gt-answer": "C. assembling together", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the concrete wall is initially melting and falling apart, but then it is shown assembling together.", "chatgpt-answer": "C. assembling together", "video-llm-prediction": "The video showcases a concrete wall that is melting and falling apart. The wall is then shown assembling together, and the video ends with the wall still standing.", "gt-answer": "C. assembling together", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the concrete wall is melting and falling apart at first, and then it shows the same wall being assembled together.", "chatgpt-answer": "C. assembling together", "video-llm-prediction": "A video showcases a concrete wall that is melting and falling apart. The video then shows the same wall being assembled together.", "gt-answer": "C. assembling together", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the concrete wall is shown melting and falling apart, then assembling together. Both choices B and C are mentioned in the video description.", "chatgpt-answer": "B. falling apart", "video-llm-prediction": "A concrete wall is shown melting and falling apart, then assembling together.", "gt-answer": "C. assembling together", "rating": 0 } ] }, "1094219575_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the flower is shown blooming and wilting, indicating that the flowers are going through a process of blooming and wilting.", "chatgpt-answer": "C. blooming and D. wilting", "video-llm-prediction": "The video showcases a beautiful white flower that is initially shown in a close-up shot. The flower is then shown in various positions, including a close-up shot of the flower blooming and a shot of the flower wilting. The video highlights the beauty and delicate nature of the flower, with a focus on its changing colors and growth.", "gt-answer": "C. blooming", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the flowers are seen in different stages of blooming and highlights their wilting as well. This indicates that the flowers are going through the process of blooming and eventually wilting.", "chatgpt-answer": "C. blooming and D. wilting", "video-llm-prediction": "The video showcases a beautiful white flower that is captured from various angles. The flower is seen in different stages of blooming, from its initial stages to its full bloom. The video also highlights the flower's wilting, which adds a sense of impermanence to the beauty of the flower. The video is a visual treat for anyone who appreciates the beauty of flowers.", "gt-answer": "C. blooming", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the flower is initially closed and then blooms, revealing its beauty. This indicates that the flowers are blooming.", "chatgpt-answer": "C. blooming", "video-llm-prediction": "The video showcases a flower that is initially closed and then blooms, revealing its beauty. The flower is shown in various stages of growth, from a bud to a fully bloomed flower. The video highlights the process of the flower's growth and the beauty of the final product.", "gt-answer": "C. blooming", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the white flower is blooming, which means it is opening up and showcasing its beauty.", "chatgpt-answer": "C. blooming", "video-llm-prediction": "A white flower blooms in a black background, showcasing its beauty.", "gt-answer": "C. blooming", "rating": 1 } ] }, "1067427023_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the snow particles are solidifying, melting, and scattering.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a close-up of snow particles, which are then seen melting and scattering. The snow particles are shown to be solidifying, melting, and scattering in the video.", "gt-answer": "A. solidifying", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the snow particles are solidifying, melting, and scattering. However, it only describes the transformation happening to the snow particles and does not mention any other process such as solidifying or scattering. Therefore, the best term to describe the transformation happening to the snow particles is \"melting.\"", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of snow melting and scattering. The camera captures the snow particles as they solidify, melt, and scatter. The sound of the melting snow adds to the immersive experience. The video provides a close-up view of the snow particles, allowing the viewer to appreciate the beauty of the melting process. The video is a perfect representation of the natural process of snow melting and scattering.", "gt-answer": "A. solidifying", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the snow particles begin to solidify, which means they are changing from a liquid state to a solid state.", "chatgpt-answer": "A. solidifying", "video-llm-prediction": "The video shows a close-up of snow particles, which then begin to solidify. The camera then pans out to show the snow particles scattered around.", "gt-answer": "A. solidifying", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the snow particles are solidifying, melting, and scattering. While all three terms are mentioned, the description emphasizes the transformation happening to the snow particles, indicating that the best term to describe this transformation is \"melting.\"", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of snow melting and scattering on the ground. The camera captures the snow particles as they solidify, melt, and scatter. The video provides a close-up view of the snow particles, highlighting their transformation from solid to liquid and back to solid again. The sound of the melting snow adds to the immersive experience, creating a calming and soothing atmosphere. The video is a perfect representation of the beauty and tranquility of snowy landscapes.", "gt-answer": "A. solidifying", "rating": 0 } ] }, "1093948229_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the substance is seen melting, shrinking, and spinning before finally exploding. Therefore, the correct answer is D. exploding.", "chatgpt-answer": "D. exploding", "video-llm-prediction": "The video showcases the process of a substance being poured into water and then exploding. The substance is seen melting, shrinking, and spinning before finally exploding. The video provides a detailed look at the process of the substance's transformation.", "gt-answer": "B. shrinking", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the golden particles are seen melting and shrinking. Additionally, it mentions that the particles explode.", "chatgpt-answer": "A. melting, B. shrinking, D. exploding", "video-llm-prediction": "The video showcases a close-up of golden particles, which then proceed to spin rapidly before exploding. The particles are seen melting and shrinking in the process. The video captures the particles in various stages of their life cycle, from their initial formation to their eventual destruction. The sound of the particles exploding adds to the immersive experience of the video. Overall, the video provides a mesmerizing display of the particles' behavior and their eventual demise.", "gt-answer": "B. shrinking", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the golden particles are melting, shrinking, spinning, and exploding.", "chatgpt-answer": "A. melting, B. shrinking, C. spinning, D. exploding", "video-llm-prediction": "A video showcasing the melting, shrinking, spinning, and exploding of golden particles.", "gt-answer": "B. shrinking", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the golden particles are seen melting, shrinking, and spinning. It also mentions that the particles then explode, creating a display of golden sparks. Therefore, all of the mentioned actions (melting, shrinking, spinning, and exploding) are happening to the golden particles.", "chatgpt-answer": "All of the choices are correct.", "video-llm-prediction": "The video showcases a pile of golden particles that are seen melting, shrinking, and spinning. The particles then explode, creating a spectacular display of golden sparks. The video captures the beauty and power of the golden particles as they transform and interact with each other.", "gt-answer": "B. shrinking", "rating": 0 } ] }, "1049965795_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions several actions happening to the light bulb - turning off, breaking, lighting up, and rapidly changing color. Therefore, the correct answer is D. rapidly changing color.", "chatgpt-answer": "D. rapidly changing color", "video-llm-prediction": "A light bulb is shown in a dark room, and it is turned off. The light bulb is then shown breaking, and it is lit up. The light bulb is then shown rapidly changing color.", "gt-answer": "A. turning off", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the light bulb starts with dimness and gradually brightens until it reaches its full brightness. It also mentions that the light bulb then begins to rapidly change colors. None of the choices accurately describe this sequence of events.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A dimly lit room features a single light bulb that is turned on and begins to glow. The light bulb gradually brightens until it reaches its full brightness. The light bulb then begins to rapidly change colors, creating a mesmerizing visual effect. The video captures the transformation of the light bulb, from its initial dimness to its full brightness and colorful display.", "gt-answer": "A. turning off", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the light bulb is turned off. None of the other choices can be inferred from the given information.", "chatgpt-answer": "A. turning off", "video-llm-prediction": "A light bulb is shown in a dark room, and it is turned off.", "gt-answer": "A. turning off", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the light bulb is turned off initially, but then it turns on and starts rapidly changing colors. None of options A, B, or C accurately describe this change in behavior. Option D, \"rapidly changing color,\" is the only choice that matches the description provided.", "chatgpt-answer": "D. rapidly changing color", "video-llm-prediction": "A light bulb is shown in a dark room, and it is turned off. The light bulb then turns on and begins to rapidly change colors.", "gt-answer": "A. turning off", "rating": 0 } ] }, "1052364490_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the digital bar chart starts with a small size and gradually increases in size.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video shows a digital bar chart that starts with a small size and gradually increases in size. The video also includes a blue digital bar chart that starts with a small size and gradually increases in size.", "gt-answer": "C. decreasing", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the digital bar chart starts small and gradually increases in size. Therefore, the correct answer is B. increasing.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video features a digital bar chart that starts small and gradually increases in size. The chart is shown in a blue color, and the video provides a close-up view of the chart. The video also features a digital graph that is shown in a blue color and features a line graph. The video ends with a digital bar chart that starts small and gradually increases in size.", "gt-answer": "C. decreasing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the digital bar chart is increasing in size.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "A digital bar chart is shown, and it increases in size.", "gt-answer": "C. decreasing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the digital bar chart starts with a small size and gradually increases in size. It also mentions that the chart is shown in a blue color, and the video ends with the same size as it started. Therefore, the correct answer is B. increasing as the bar chart grows in size throughout the video.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video features a digital bar chart that starts with a small size and gradually increases in size. The chart is shown in a blue color, and the video ends with the same size as it started.", "gt-answer": "C. decreasing", "rating": 0 } ] }, "1080990179_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the apple is being cut in half. There is no indication of the apple shrinking, drying out, or growing bigger.", "chatgpt-answer": "A. being cut", "video-llm-prediction": "The video starts with a close-up shot of an apple, and then it shows the apple being cut in half. The camera then zooms in on the apple, and it is seen drying out and shrinking. The video ends with the apple being cut in half again. The information that is consistent with the video is that the apple is being cut in half. The other information is not relevant to the video content.", "gt-answer": "C. growing bigger", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the process being showcased is of an apple being cut open and revealing its insides. The camera zooms in on the apple, highlighting its texture and color, and then transitions to a close-up shot of the apple's insides, revealing the seeds and other internal structures. This indicates that the apple is being cut.", "chatgpt-answer": "A. being cut", "video-llm-prediction": "The video showcases the process of an apple being cut open and revealing its insides. The camera zooms in on the apple, highlighting its texture and color. The video then transitions to a close-up shot of the apple's insides, revealing the seeds and other internal structures. The camera then zooms out, providing a broader perspective of the apple. The video emphasizes the apple's growth and development, from its initial stages to its final form. The video also highlights the apple's texture and color, emphasizing its natural beauty. Overall, the video provides a detailed", "gt-answer": "C. growing bigger", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the apple is being cut in half and then drying out and shrinking.", "chatgpt-answer": "B. shrinking and drying out", "video-llm-prediction": "The video shows an apple being cut in half, revealing the inside of the fruit. The apple is then shown drying out and shrinking.", "gt-answer": "C. growing bigger", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the apple is being cut in half and then the inside of the apple is shown drying out and shrinking.", "chatgpt-answer": "B. shrinking and drying out", "video-llm-prediction": "The video shows an apple being cut in half, revealing the inside of the fruit. The inside of the apple is then shown drying out and shrinking.", "gt-answer": "C. growing bigger", "rating": 0 } ] }, "1077575504_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the pile of salt is being poured into a bowl and then poured into a sieve. It also states that the salt is then poured back into a bowl. These actions suggest that the salt is being moved or transferred, but it does not provide any information about its size changing, melting, or disappearing completely.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a pile of salt being poured into a bowl and then being poured into a sieve. The salt is then poured into a bowl and the video ends with a close-up of the salt.", "gt-answer": "D. disappearing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the pile of salt starts to scatter, continues to grow, and eventually melts. Finally, it disappears. This implies a sequence of events where the salt scatters, grows, melts, and then disappears.", "chatgpt-answer": "D. disappearing", "video-llm-prediction": "A pile of salt is shown, and it starts to scatter. The salt continues to grow, and eventually, it melts. The pile of salt eventually disappears.", "gt-answer": "D. disappearing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the pile of salt starts to scatter, then grows, and eventually melts. Finally, the video ends with the pile of salt disappearing. This indicates a clear sequence of events, starting with scattering, then growing, followed by melting, and ultimately disappearing.", "chatgpt-answer": "D. disappearing", "video-llm-prediction": "A pile of salt is shown, and it starts to scatter. The salt then grows, and it eventually melts. The video ends with the pile of salt disappearing.", "gt-answer": "D. disappearing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the pile of salt begins to scatter, continues to grow, starts to melt, and eventually disappears.", "chatgpt-answer": "D. disappearing", "video-llm-prediction": "A pile of salt is shown, and it begins to scatter. The salt continues to grow, and eventually, it starts to melt. The pile of salt eventually disappears.", "gt-answer": "D. disappearing", "rating": 1 } ] }, "23370985_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the ice is melting and shattering. Choice A, freezing, is not consistent with the video description. Choice B, melting, is consistent with the video description. Choice C, shattering, is also consistent with the video description.", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of ice melting and shattering. The first piece of information, A, describes the ice crystal as freezing, which is consistent with the video. The second piece of information, B, describes the ice crystal as melting, which is also consistent with the video. The third piece of information, C, describes the ice crystal as shattering, which is not consistent with the video.", "gt-answer": "B. melting", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the ice crystal is transforming from a solid to a liquid state, highlighting the process of melting. Additionally, it mentions that the ice shatters, indicating the process of shattering is also occurring.", "chatgpt-answer": "B. melting", "video-llm-prediction": "The video showcases the process of ice melting and shattering, with a focus on the ice crystal's transformation from a solid to a liquid state. The video begins with a close-up shot of a single ice crystal, which then transitions to a series of shots displaying the ice melting and shattering. The camera captures the ice crystal's transformation from a solid to a liquid state, highlighting the ice's melting process. The video also emphasizes the ice's shattering, capturing the ice's sudden breakage into smaller pieces. The video'", "gt-answer": "B. melting", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the ice crystals are shattering.", "chatgpt-answer": "C. shattering", "video-llm-prediction": "A close-up shot of ice crystals is shown, and they begin to shatter.", "gt-answer": "B. melting", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the ice crystals are seen freezing, melting, and shattering in a visually appealing manner. This suggests that all three actions - freezing, melting, and shattering - are happening to the ice crystals.", "chatgpt-answer": "A. freezing, B. melting, C. shattering", "video-llm-prediction": "The video showcases the process of ice melting and shattering. The ice crystals are seen freezing, melting, and shattering in a visually appealing manner. The video captures the transformation of the ice crystals from solid to liquid and then to shattered pieces. The sound of the ice shattering adds to the immersive experience. The video is perfect for those who enjoy watching the beauty of nature's transformation.", "gt-answer": "B. melting", "rating": 0 } ] }, "1055981522_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the 3D shapes change in appearance and specifically mentions that they start as cubes and then turn into triangles before finally turning into spheres.", "chatgpt-answer": "B. turning into triangles", "video-llm-prediction": "The video showcases a series of 3D shapes that change in appearance. The shapes start as cubes and then turn into triangles before finally turning into spheres. The video is a visual representation of the changing nature of 3D shapes.", "gt-answer": "D. turning into cubes", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the 3D shapes are changing in appearance and turning into triangles, spheres, and cubes.", "chatgpt-answer": "B. turning into triangles", "video-llm-prediction": "The video showcases a series of 3D shapes that change in appearance, turning into triangles, spheres, and cubes. The video starts with a single shape, which then morphs into several other shapes, creating a visually captivating experience. The video's focus is on the transformation of the shapes, highlighting the intricate details and the fluidity of the changes. The video's visuals are complemented by the use of different colors and textures, adding depth and complexity to the shapes. Overall, the video is a mesmerizing display of 3D shape transformation, leaving the", "gt-answer": "D. turning into cubes", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the 3D shapes are disappearing and turning into triangles, spheres, and cubes.", "chatgpt-answer": "A. disappearing", "video-llm-prediction": "A video showcasing 3D shapes that disappear and turn into triangles, spheres, and cubes.", "gt-answer": "D. turning into cubes", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the shapes are transformed into different shapes, including triangles, spheres, and cubes. This implies that the shapes are not disappearing, but rather changing into different forms.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases various 3D shapes that are shown in different colors and sizes. The shapes are then transformed into different shapes, including triangles, spheres, and cubes. The video ends with the shapes disappearing.", "gt-answer": "D. turning into cubes", "rating": 0 } ] }, "1081734740_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the leaf is changing its color from green to yellow and then back to green. Therefore, the correct answer is A - It is turning from green to yellow.", "chatgpt-answer": "A. It is turning from green to yellow", "video-llm-prediction": "The video showcases the natural process of a leaf changing its color from green to yellow. The video starts with a close-up shot of a leaf, and then it transitions to a shot of the same leaf turning yellow. The video then shows the same leaf turning green again. The video emphasizes the natural process of a leaf changing its color and the beauty of nature.", "gt-answer": "D. It is turning from yellow to green", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the leaves are seen in various stages of change, from green to yellow and white. This suggests that the texture of the leaf is changing as it transitions in color.", "chatgpt-answer": "A. It is turning from green to yellow", "video-llm-prediction": "The video showcases the natural beauty of leaves changing colors. The leaves are seen in various stages of change, from green to yellow and white. The video highlights the intricate patterns and textures of the leaves, which are a testament to the beauty of nature. The video is a visual treat for anyone who appreciates the beauty of nature.", "gt-answer": "D. It is turning from yellow to green", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the leaf is turning from green to yellow.", "chatgpt-answer": "A. It is turning from green to yellow", "video-llm-prediction": "A leaf is shown in the video, and it is turning from green to yellow.", "gt-answer": "D. It is turning from yellow to green", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the leaves are seen in various stages of change, from green to yellow and white. This indicates that the texture of the leaf is changing from green to yellow.", "chatgpt-answer": "A. It is turning from green to yellow", "video-llm-prediction": "The video showcases the natural beauty of leaves changing colors. The leaves are seen in various stages of change, from green to yellow and white. The video provides a close-up view of the leaves, highlighting their intricate texture and vibrant colors. The video is a perfect representation of the beauty of nature and the changing seasons.", "gt-answer": "D. It is turning from yellow to green", "rating": 0 } ] }, "1093719871_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the pink flowers are initially withered and dying, but as the video progresses, they start to grow taller and blossom. Then, the video shows a close-up shot of the flowers turning from withered to full blossom. Finally, the video ends with the flowers turning from full blossom to withered.", "chatgpt-answer": "C. turning from withered to full blossom", "video-llm-prediction": "The video showcases a bunch of pink flowers that are initially withered and dying. However, as the video progresses, the flowers start to grow taller and blossom. The flowers are then shown in a close-up shot, and they are seen turning from withered to full blossom. The video ends with the flowers turning from full blossom to withered.", "gt-answer": "D. turning from full blossom to withered", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the flowers are initially shown in a withered state but then grow taller and eventually turn into full blossoms. This indicates that the flowers are undergoing a transformation from their withered state to their full bloom.", "chatgpt-answer": "C. turning from withered to full blossom", "video-llm-prediction": "The video showcases a beautiful display of pink flowers, which are initially shown in a withered state. However, as the video progresses, the flowers start to grow taller and eventually turn into full blossoms. The video captures the natural process of the flowers' growth and transformation, from their initial state to their full bloom. The viewer can appreciate the beauty and grace of the flowers as they grow and change throughout the video.", "gt-answer": "D. turning from full blossom to withered", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the pink flowers are growing taller and turning from withered to full blossom.", "chatgpt-answer": "C. turning from withered to full blossom", "video-llm-prediction": "The video showcases the process of pink flowers growing taller and turning from withered to full blossom. The video starts with a close-up shot of pink flowers, and then it transitions to a wider shot of the flowers. The flowers are shown growing taller and turning from withered to full blossom. The video ends with a shot of the flowers turning from full blossom to withered.", "gt-answer": "D. turning from full blossom to withered", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the flowers are seen growing taller, turning from withered to full blossom, and turning from full blossom to withered.", "chatgpt-answer": "A. growing taller, C. turning from withered to full blossom, D. turning from full blossom to withered", "video-llm-prediction": "The video showcases a beautiful display of pink flowers in various stages of blossom. The flowers are seen growing taller and turning from withered to full blossom. The video also captures the flowers turning from full blossom to withered. The video highlights the beauty of nature and the different stages of the flowers' life cycle.", "gt-answer": "D. turning from full blossom to withered", "rating": 0 } ] }, "1055973887_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the fire ball is shown getting smaller and larger, but it also mentions that there is an instance where the fire ball stays the same size.", "chatgpt-answer": "A. staying the same size", "video-llm-prediction": "A fire ball is shown in the video, and it is seen getting smaller and larger. The fire ball is the subject of the video, and it is seen staying the same size in one instance.", "gt-answer": "B. getting smaller", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is initially the same size and then gradually gets smaller before getting larger again.", "chatgpt-answer": "C. getting larger", "video-llm-prediction": "The video shows a large fire ball that is initially the same size and then gradually gets smaller before getting larger again.", "gt-answer": "B. getting smaller", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the fire ball is seen getting smaller and larger, indicating that its size is changing.", "chatgpt-answer": "C. getting larger", "video-llm-prediction": "A fire ball is shown in the video, and it is seen getting smaller and larger. The fire ball is the only consistent element in the video.", "gt-answer": "B. getting smaller", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the fire ball is seen getting larger and smaller.", "chatgpt-answer": "C. getting larger", "video-llm-prediction": "A fire ball is shown in the video, and it is seen getting larger and smaller. The fire ball is the subject of the video, and it is the only information that matches the content of the video.", "gt-answer": "B. getting smaller", "rating": 0 } ] }, "1098710341_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the glass is being filled and then emptied. This implies that the glass is going from full of water to empty.", "chatgpt-answer": "B. It is going from full of water to empty", "video-llm-prediction": "The video shows a glass of water being filled and then emptied. The glass is shown in different positions, including on a table and in a hand. The video also includes a shot of a person pouring water into the glass.", "gt-answer": "B. It is going from full of water to empty", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the glass is being filled with water and then drained, indicating a transition from full of water to empty.", "chatgpt-answer": "B. It is going from full of water to empty", "video-llm-prediction": "The video shows a glass being filled with water and then drained. The glass is shown in different positions, including on a table and in a hand. The video also includes a close-up shot of the glass.", "gt-answer": "B. It is going from full of water to empty", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the glass is shown changing from full to empty and back again. This implies that the glass is going from full of water to empty and then going back to being full of water.", "chatgpt-answer": "C. It is going from empty to full of water", "video-llm-prediction": "The video shows a glass of water being filled and then emptied. The glass is shown changing from full to empty and back again.", "gt-answer": "B. It is going from full of water to empty", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the glass is being filled with water and then being drained. Therefore, the correct answer is B. It is going from full of water to empty.", "chatgpt-answer": "B. It is going from full of water to empty", "video-llm-prediction": "The video shows a glass being filled with water and then being drained. The glass is shown in different positions, including being held by a person and sitting on a table. The video also includes a close-up shot of the glass.", "gt-answer": "B. It is going from full of water to empty", "rating": 1 } ] }, "1099116143_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description explicitly states that the pink liquid is freezing. There is no mention of white foam appearing or disappearing, so choices A and B can be eliminated. Additionally, there is no information provided about the liquid evaporating, so choice D can also be eliminated.", "chatgpt-answer": "C. It is freezing", "video-llm-prediction": "The video features a close-up shot of a pink liquid in a glass, which is then shown freezing and evaporating. The video also includes a piece of information that suggests the pink liquid is freezing.", "gt-answer": "A. White foam disappears from the surface", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the pink liquid is observed to be freezing and evaporating.", "chatgpt-answer": "D. It is evaporating", "video-llm-prediction": "The video showcases a close-up of a pink liquid, which is then observed to be freezing and evaporating. The video captures the transformation of the liquid, from its initial state to the final outcome. The video highlights the process of freezing and evaporating, which is a fascinating natural phenomenon. The video is a great example of the beauty of nature and the power of science.", "gt-answer": "A. White foam disappears from the surface", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions several events happening to the pink liquid, including the white foam disappearing and reappearing on the surface, freezing, and evaporating.", "chatgpt-answer": "A. White foam disappears from the surface, B. White foam appears on the surface, C. It is freezing, and D. It is evaporating.", "video-llm-prediction": "A pink liquid is shown in a video, and it is observed that the white foam disappears from the surface. Later, the white foam appears on the surface. The pink liquid is then observed to be freezing, and it is also observed to be evaporating.", "gt-answer": "A. White foam disappears from the surface", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the pink liquid is observed to have white foam on its surface, and it is seen to be freezing and evaporating. This indicates that the white foam appears on the surface (choice B) and the liquid is both freezing (choice C) and evaporating (choice D).", "chatgpt-answer": "B. White foam appears on the surface", "video-llm-prediction": "The video showcases a pink liquid that is being observed through a microscope. The liquid is seen to be freezing and evaporating, and it is observed to have white foam on its surface.", "gt-answer": "A. White foam disappears from the surface", "rating": 0 } ] }, "1025623079_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the skyscraper is in the process of being constructed. However, towards the end of the video, it is shown collapsing.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "The video shows a skyscraper that is in the process of being constructed. The building is seen growing taller and taller as it is being built. However, towards the end of the video, the building is shown collapsing. The information that is consistent with the video is that the building is in the process of being constructed.", "gt-answer": "B. growing taller", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the skyscraper is in the process of collapsing.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "A skyscraper is shown in the video, and it is in the process of collapsing. The building is seen growing taller and then collapsing in the end. The video captures the moment when the building is in construction, and it is shown in the process of collapsing.", "gt-answer": "B. growing taller", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the skyscraper is growing taller initially, but it collapses in the end.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "A skyscraper is shown in the video, and it is growing taller. However, it collapses in the end.", "gt-answer": "B. growing taller", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the skyscraper is in the process of collapsing.", "chatgpt-answer": "D. collapsing", "video-llm-prediction": "A skyscraper is shown in the video, and it is in the process of collapsing. The building is seen growing taller and then collapsing.", "gt-answer": "B. growing taller", "rating": 0 } ] }, "1063373449_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the coronavirus is seen replicating itself, mutating into a new strain, assembling together, and then being attacked by antibodies, causing it to dissolve. Hence, all of the choices are correct.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "The video showcases the replication of the coronavirus, which is mutating into a new strain. The virus is seen assembling together and then being attacked by antibodies, causing it to dissolve.", "gt-answer": "C. assembling together", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the coronavirus is replicating and mutating, as well as assembling and dissolving under the attack of antibodies.", "chatgpt-answer": "A. replicating itself, B. mutating into a new strain, C. assembling together, D. dissolving under the attack of antibodies", "video-llm-prediction": "The video showcases the replication and mutation of the coronavirus, as well as its ability to assemble and dissolve under the attack of antibodies.", "gt-answer": "C. assembling together", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the coronavirus is replicating itself, mutating into a new strain, and assembling together. Additionally, it mentions that the coronavirus is being attacked by antibodies, causing it to dissolve.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "The video shows the process of the coronavirus replicating itself, mutating into a new strain, and assembling together. The video also shows the coronavirus being attacked by antibodies, causing it to dissolve.", "gt-answer": "C. assembling together", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the coronavirus is replicating and mutating, as well as undergoing assembly and dissolution under the attack of antibodies.", "chatgpt-answer": "A. replicating itself, B. mutating into a new strain, C. assembling together, D. dissolving under the attack of antibodies", "video-llm-prediction": "The video showcases the replication and mutation of the coronavirus, as well as its ability to assemble and dissolve under the attack of antibodies.", "gt-answer": "C. assembling together", "rating": 0 } ] }, "1062609286_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the battery charge indicator starts at 100% and gradually decreases to 0%. This indicates that the battery charge is decreasing.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "The video shows a battery charge indicator with a blue background and white text. The indicator starts at 100% and gradually decreases to 0%.", "gt-answer": "A. decreasing", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the battery charge percentage starts at 100% and gradually decreases, then stays constant, and finally increases. This indicates a change in the battery charge over time.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "The video displays a battery charge indicator with a blue background and white text. The indicator shows the battery charge percentage, which starts at 100% and gradually decreases. The video also shows the battery charge indicator with a green background and white text, which shows the battery charge percentage staying constant. Additionally, the video displays the battery charge indicator with a red background and white text, which shows the battery charge percentage increasing.", "gt-answer": "A. decreasing", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the car's battery charge is decreasing.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "A car's battery charge is shown in a video, and it is decreasing.", "gt-answer": "A. decreasing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the car's battery charge starts at 100% and gradually decreases to 80%. This indicates that the battery charge is decreasing.", "chatgpt-answer": "A. decreasing", "video-llm-prediction": "The video showcases a car's battery charge, which starts at 100% and gradually decreases to 80%. The video also highlights the importance of maintaining a battery's charge.", "gt-answer": "A. decreasing", "rating": 1 } ] }, "1060403198_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the tree has green leaves which gradually change to brown and shed their leaves. This indicates that the tree is changing color and shedding its leaves.", "chatgpt-answer": "D. changing color", "video-llm-prediction": "The video showcases a tree with green leaves, which gradually change to brown and shed their leaves. The tree is shown in different positions, including a close-up of its branches and a wider shot of the tree in a field. The video also includes a shot of a person standing in front of the tree.", "gt-answer": "B. decreasing height", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the tree starts off small and gradually grows taller. It also mentions that the leaves fall off the tree, indicating that the tree is shedding its leaves. These details suggest that the correct answer should be a combination of increasing height (A) and shedding leaves (C).", "chatgpt-answer": "A. increasing height, C. shedding leaves", "video-llm-prediction": "The video showcases a tree with green leaves, which gradually change to brown as the seasons progress. The tree is initially small and bare, but it gradually grows taller and taller. The leaves fall off the tree, and the tree becomes bare again. The video provides a visual representation of the tree's growth and seasonal changes.", "gt-answer": "B. decreasing height", "rating": 0 }, { "chatgpt-reasoning": "The video describes that the tree is growing taller, shedding leaves, and changing color.", "chatgpt-answer": "A. increasing height, C. shedding leaves, D. changing color", "video-llm-prediction": "A tree is shown in the video, and it is seen growing taller and taller. The leaves are also shedding, and the tree is changing color.", "gt-answer": "B. decreasing height", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the tree is changing colors, shedding leaves, and growing taller. Therefore, options A, B, and C are all correct.", "chatgpt-answer": "A. increasing height, C. shedding leaves", "video-llm-prediction": "A tree is shown in the video, and it is seen changing colors and shedding leaves. The video also shows the tree growing taller and taller.", "gt-answer": "B. decreasing height", "rating": 0 } ] }, "1099109715_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that there is a variety of fruits and vegetables, including tomatoes, blueberries, and peppers. It does not mention anything about the fruits and vegetables becoming rotten or staying the same. The emphasis of the video is on the importance of consuming a variety of them for a healthy diet, which suggests that the number of fruits and vegetables is likely increasing.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, blueberries, and peppers. The tomatoes are shown in a bowl, while the blueberries and peppers are displayed on a table. The video emphasizes the importance of consuming a variety of fruits and vegetables for a healthy diet. The video also highlights the potential negative effects of consuming too much of certain fruits and vegetables. Overall, the video provides a helpful reminder to maintain a balanced diet and to be mindful of the foods we consume.", "gt-answer": "C. decreasing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that a variety of fruits and vegetables are showcased, including tomatoes, blueberries, and peppers. This indicates that the number of fruits and vegetables is increasing as different types are being displayed.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, blueberries, and peppers. The tomatoes are shown in a bowl, while the blueberries and peppers are displayed on a table. The video emphasizes the importance of consuming a diverse range of fruits and vegetables for a healthy diet.", "gt-answer": "C. decreasing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video showcases a variety of fruits and vegetables. It also highlights the benefits of incorporating these foods into one's daily routine, which suggests that it promotes the consumption of fruits and vegetables.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, blueberries, and peppers. The video emphasizes the importance of consuming a diverse range of fruits and vegetables for a healthy diet. The video also highlights the benefits of incorporating these foods into one's daily routine.", "gt-answer": "C. decreasing", "rating": 0 }, { "chatgpt-reasoning": "The video showcases a variety of fruits and vegetables, including tomatoes, blueberries, and peppers. It mentions that the video emphasizes the importance of consuming a variety of fruits and vegetables for a healthy diet. From this information, we can infer that the number of fruits and vegetables is increasing.", "chatgpt-answer": "B. increasing", "video-llm-prediction": "The video showcases a variety of fruits and vegetables, including tomatoes, blueberries, and peppers. The tomatoes are shown in different positions, including on a table and in a bowl. The blueberries are also displayed in a bowl, and the peppers are shown in a bowl and on a table. The video emphasizes the importance of consuming a variety of fruits and vegetables for a healthy diet.", "gt-answer": "C. decreasing", "rating": 0 } ] }, "1051211272_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the toast with cream cheese is being gradually eaten out and disappearing.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "The video shows a piece of toast with cream cheese being gradually eaten out and disappearing. The toast is shown in different positions, including on a wooden table and a cutting board. The video also includes a close-up shot of the toast with cream cheese.", "gt-answer": "A. gradually reappearing piece by piece", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sandwich with cream cheese is gradually being eaten out and disappearing.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "The video showcases a close-up of a sandwich with cream cheese on top, which is gradually being eaten out and disappearing. The sandwich is made with bread and cream cheese, and it is placed on a wooden table. The video also includes a shot of a leafy green plant, which is not related to the sandwich.", "gt-answer": "A. gradually reappearing piece by piece", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the toast with cream cheese is gradually reappearing piece by piece.", "chatgpt-answer": "A. gradually reappearing piece by piece", "video-llm-prediction": "A piece of toast with cream cheese is shown, and it gradually reappears piece by piece.", "gt-answer": "A. gradually reappearing piece by piece", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the sandwich is being cut into four pieces and eaten. This implies that the sandwich is gradually being eaten out and disappearing.", "chatgpt-answer": "C. gradually being eaten out and disappearing", "video-llm-prediction": "A person is seen making a sandwich with tomatoes and cream cheese. The sandwich is then cut into four pieces and eaten.", "gt-answer": "A. gradually reappearing piece by piece", "rating": 0 } ] }, "1059815936_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the paper is going through a transformation from a wrinkled paper ball into a flattened sheet, and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from a wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video showcases the transformation of a wrinkled paper ball into a flattened sheet, and then back into a wrinkled paper ball. The video emphasizes the process of transformation and the changes in the paper's appearance.", "gt-answer": "C. changing from a flattened sheet into a wrinkled paper ball", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the paper is transforming from a wrinkled paper ball into a flattened sheet, and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from a wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video showcases the transformation of a wrinkled paper ball into a flattened sheet, and then back into a wrinkled paper ball.", "gt-answer": "C. changing from a flattened sheet into a wrinkled paper ball", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the paper is being crumpled up and then flattened out. Hence, the correct answer is the option that describes this transformation.", "chatgpt-answer": "A. changing from a wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video shows a piece of paper being crumpled up and then flattened out.", "gt-answer": "C. changing from a flattened sheet into a wrinkled paper ball", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the paper is transforming from a wrinkled paper ball into a flattened sheet, and then back into a wrinkled paper ball.", "chatgpt-answer": "A. changing from a wrinkled paper ball into a flattened sheet", "video-llm-prediction": "The video showcases the transformation of a wrinkled paper ball into a flattened sheet, and then back into a wrinkled paper ball.", "gt-answer": "C. changing from a flattened sheet into a wrinkled paper ball", "rating": 0 } ] }, "1059718130_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the sun is appearing to rise faster than the clouds.", "chatgpt-answer": "B. rising faster than the sun below", "video-llm-prediction": "The video showcases the sun rising above the clouds, with the sun appearing to rise faster than the clouds. The video captures the beauty of the sun rising above the clouds, with the sun appearing to rise at the same speed as the clouds. The video is a visual representation of the sun rising above the clouds, with the sun appearing to rise faster than the clouds.", "gt-answer": "C. rising at the same speed as the sun below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun is seen rising slowly in the beginning, but gradually speeds up as the video progresses. This indicates that the sun is rising faster than the clouds.", "chatgpt-answer": "B. rising faster than the sun below", "video-llm-prediction": "The video showcases the sun rising above the clouds, with the sun appearing to rise faster than the clouds. The sun is seen rising slowly in the beginning, but gradually speeds up as the video progresses. The video captures the beauty of the sun rising above the clouds, with the sun appearing to rise faster than the clouds. The sun is seen rising slowly in the beginning, but gradually speeds up as the video progresses. The video captures the beauty of the sun rising above the clouds, with the sun appearing to rise faster than the clouds. The sun is seen rising slowly in the beginning, but gradually speeds", "gt-answer": "C. rising at the same speed as the sun below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the clouds are moving faster than the sun. Since the sun is rising, it can be inferred that the sun is rising slower than the clouds.", "chatgpt-answer": "A. rising slower than the sun below", "video-llm-prediction": "The sun is seen rising in the sky, with the clouds moving faster than the sun.", "gt-answer": "C. rising at the same speed as the sun below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun is seen rising slower than the clouds, indicating that the speed of the sun above is slower than the speed of the sun below.", "chatgpt-answer": "A. rising slower than the sun below", "video-llm-prediction": "The sun is seen rising in the sky, with the clouds moving faster than the sun. The sun is also seen rising slower than the clouds.", "gt-answer": "C. rising at the same speed as the sun below", "rating": 0 } ] }, "1059718130_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description states that \"the sun appears to rise faster than the sun below.\" This implies that the speed of the sun above is greater than the speed of the sun below.", "chatgpt-answer": "A. rising faster than the sun below", "video-llm-prediction": "The video features a beautiful sunset with the sun rising in the sky. The video starts with a close-up of the sun setting, and then it pans out to show the sun rising in the sky. The video captures the beauty of the sunset and the rising of the sun, with the sun appearing to rise faster than the sun below. The video is a perfect representation of the beauty of nature and the power of the sun.", "gt-answer": "B. rising slower than the sun below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun is seen rising in the sky, with the sun appearing to rise slower than the clouds. Therefore, the correct answer would be \"B. rising slower than the sun below.\"", "chatgpt-answer": "B. rising slower than the sun below", "video-llm-prediction": "The video showcases the sun rising in the sky, with the sun appearing to rise faster than the clouds. The sun is seen rising in the sky, with the sun appearing to rise slower than the clouds. The sun is seen rising in the sky, with the sun rising at the same speed as the clouds.", "gt-answer": "B. rising slower than the sun below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the sun is rising above the clouds, with the clouds moving faster than the sun below. This implies that the speed of the sun above is slower than the speed of the clouds below.", "chatgpt-answer": "B. rising slower than the sun below", "video-llm-prediction": "The video shows the sun rising above the clouds, with the clouds moving faster than the sun below.", "gt-answer": "B. rising slower than the sun below", "rating": 1 }, { "chatgpt-reasoning": "According to the video description, the sun is seen rising above the clouds, with the clouds moving faster than the sun below. Therefore, the correct answer is that the sun is rising slower than the sun below.", "chatgpt-answer": "B. rising slower than the sun below", "video-llm-prediction": "The sun is seen rising above the clouds, with the clouds moving faster than the sun below. The video captures the beauty of the sun rising above the clouds, with the clouds moving at a faster pace than the sun below.", "gt-answer": "B. rising slower than the sun below", "rating": 1 } ] }, "1059718130_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the sun appears to rise faster than the clouds, which means that the speed of the sun above is faster than the speed of the sun below.", "chatgpt-answer": "C. rising faster than the sun below", "video-llm-prediction": "The video shows the sun rising above the clouds, with the sun appearing to rise faster than the clouds. The video also shows the sun setting below the clouds, with the sun appearing to set slower than the clouds.", "gt-answer": "C. rising faster than the sun below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the sun appears to rise at a faster speed than the clouds.", "chatgpt-answer": "C. rising faster than the sun below", "video-llm-prediction": "The video showcases the sun rising above the clouds, with the sun appearing to rise at a faster speed than the clouds. The video captures the beauty of the sunrise, with the sun appearing to rise above the clouds. The video is a perfect representation of the sun rising above the clouds, with the sun appearing to rise at a faster speed than the clouds.", "gt-answer": "C. rising faster than the sun below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the sun above is rising slower than the sun below.", "chatgpt-answer": "B. rising slower than the sun below", "video-llm-prediction": "The video shows the sun rising in the sky, with the sun above rising at the same speed as the sun below. The sun is seen in the sky, with the sun above rising slower than the sun below. The video also shows the sun rising in the sky, with the sun above rising faster than the sun below.", "gt-answer": "C. rising faster than the sun below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun is rising in the sky, with the clouds moving in the same direction as the sun. Since the question asks about the speed of the sun, we can infer that the sun is rising at a certain speed. Therefore, the correct answer would be A. rising at the same speed as the sun below.", "chatgpt-answer": "A. rising at the same speed as the sun below", "video-llm-prediction": "The sun is seen rising in the sky, with the clouds moving in the same direction as the sun.", "gt-answer": "C. rising faster than the sun below", "rating": 0 } ] }, "1098153561_concat_0": { "speed": [ { "chatgpt-reasoning": "Based on the video description, there is no mention of the forest changing color. The description only mentions the varying sizes and colors of the trees, but it does not specify any changes in color over time. Therefore, we cannot determine the speed at which the forest above is changing color.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene forest with trees of varying sizes and colors. The camera pans up to show the trees from above, and the viewer can see the sun shining through the leaves. The camera then pans down to show the forest from below, and the viewer can see the ground and the sky. The video ends with the camera panning up to show the trees from above again.", "gt-answer": "B. at the same speed as the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed at which the forest above is changing color in comparison to the forest below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the beauty of nature with a focus on the vibrant colors of the trees. The camera pans up to show the trees from above, and the sun shines through the leaves, creating a stunning visual effect. The video also features a bird flying through the trees, adding to the serene atmosphere. The camera then pans down to show the trees from below, highlighting their grandeur and the intricate patterns of their branches. Overall, the video is a captivating tribute to the beauty of nature.", "gt-answer": "B. at the same speed as the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans up to show the trees from above and then pans down to show the forest from below. This implies that the changing color of the forest above is happening at a different speed compared to the forest below.", "chatgpt-answer": "A. faster than the forest below", "video-llm-prediction": "The video showcases a forest with yellowing leaves, and the camera pans up to show the trees from above. The camera then pans down to show the forest from below.", "gt-answer": "B. at the same speed as the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the camera pans up to capture the beauty of the trees, suggesting that the forest above is changing color at a different speed compared to the forest below.", "chatgpt-answer": "A. faster than the forest below", "video-llm-prediction": "The video showcases a serene forest with vibrant colors of yellow and orange leaves. The camera pans up to capture the beauty of the trees, and then pans down to show the ground. The video ends with a panoramic view of the forest.", "gt-answer": "B. at the same speed as the forest below", "rating": 0 } ] }, "1098153561_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the camera pans up to show the trees from above and then pans down to show the trees from below. This suggests that the forest above and the forest below are changing color at different speeds.", "chatgpt-answer": "A. slower than the forest below", "video-llm-prediction": "The video showcases a serene forest with trees of varying heights and colors. The camera pans up to show the trees from above, and then pans down to show the trees from below. The video captures the beauty of nature and the tranquility of the forest.", "gt-answer": "A. slower than the forest below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans up to show the trees from above, and then pans down to show the trees from below. This implies that the changing of colors in the forest above and below are being compared.", "chatgpt-answer": "C. at the same speed as the forest below", "video-llm-prediction": "The video showcases the beauty of nature, with a focus on the vibrant colors of the trees. The camera pans up to show the trees from above, and then pans down to show the trees from below. The video captures the changing colors of the leaves, from green to yellow, and then to orange. The camera also captures the sun shining through the trees, creating a serene and peaceful atmosphere. The video ends with a panoramic view of the forest, showcasing the vastness and beauty of nature.", "gt-answer": "A. slower than the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the camera pans up to show the trees from above and then pans down to show the trees from below. This suggests that both perspectives of the forest are shown in the video. Given that there is no specific information about the speed at which the color changes in either perspective, it is safe to assume that the video does not provide enough information to determine the speed of color change in the forest above compared to the forest below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a forest with trees of different sizes and colors. The camera pans up to show the trees from above, and then pans down to show the trees from below. The video also includes a shot of the forest from above, and a shot of the forest from below.", "gt-answer": "A. slower than the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans up and down to capture the beauty of the trees. It also mentions that the video starts with a slow pan up and ends with a slow pan down. However, it does not provide any information about the speed at which the color change is happening in the forest above compared to the forest below. Therefore, there is not enough information to determine the speed at which the forest above is changing color.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a serene forest with vibrant yellow leaves, and the camera pans up and down to capture the beauty of the trees. The video starts with a slow pan up, and the camera captures the beauty of the forest above. The camera then pans down, and the video ends with a slow pan down.", "gt-answer": "A. slower than the forest below", "rating": 0 } ] }, "1098153561_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the camera pans up and down to capture the vibrant colors of the leaves. It does not give any indication of different speeds for the color changes in different parts of the forest.", "chatgpt-answer": "C. at the same speed as the forest below", "video-llm-prediction": "The video showcases the beauty of nature with a focus on the changing colors of leaves in a forest. The camera pans up and down to capture the vibrant colors of the leaves, and the video ends with a panoramic view of the forest.", "gt-answer": "A. faster than the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there is a time-lapse effect which highlights the changing colors of the leaves. This suggests that the forest above is changing color at a faster pace compared to the forest below, as time-lapse effects often compress time and make changes appear faster than they actually are.", "chatgpt-answer": "A. faster than the forest below", "video-llm-prediction": "The video showcases the beauty of nature, with a focus on the vibrant colors of the trees during the fall season. The camera pans up to show the trees, and then down to show the ground below. The video also includes a time-lapse effect, which highlights the changing colors of the leaves. The video captures the essence of the fall season, with its warm and inviting colors, and the peacefulness of the forest.", "gt-answer": "A. faster than the forest below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the camera pans up and down to show the forest from different perspectives. However, it doesn't provide any specific information about the speed at which the color of the forest is changing.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a forest with yellowing leaves, and the camera pans up to show the trees from above. The camera then pans down to show the forest from below. The video ends with the camera panning up to show the trees from above again.", "gt-answer": "A. faster than the forest below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans up to show the trees filled with yellow and orange leaves, and then it pans down to show the ground covered in fallen leaves. This suggests that the trees are changing color faster than the fallen leaves on the ground.", "chatgpt-answer": "A. faster than the forest below", "video-llm-prediction": "The video showcases the beauty of nature as it captures the vibrant colors of the fall season. The camera pans up to show the trees, which are filled with yellow and orange leaves. The leaves are seen swaying in the wind, and the camera captures the movement of the leaves. The video then pans down to show the ground, which is covered in a blanket of fallen leaves. The camera captures the leaves as they blow around in the wind. The video ends with the camera panning up to show the trees once again. Overall, the video is a beautiful representation of the fall season", "gt-answer": "A. faster than the forest below", "rating": 1 } ] }, "1059462749_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the person climbing down is climbing faster than the person climbing above him.", "chatgpt-answer": "A. Climbing faster than the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing down. The man climbing down is seen climbing faster than the man climbing above him.", "gt-answer": "C. Climbing at the same speed as the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the man is climbing faster than the person below him.", "chatgpt-answer": "A. Climbing faster than the person below", "video-llm-prediction": "The video shows a man climbing a metal staircase, and he is seen climbing faster than the person below him. The man is wearing blue jeans and a blue shirt, and he is barefoot. The staircase is made of metal, and it is located in a public place. The man is seen climbing up the stairs while looking at the camera. The video captures the man's movements as he climbs up the stairs, and the camera angle changes as he climbs higher. The video ends with the man reaching the top of the staircase.", "gt-answer": "C. Climbing at the same speed as the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person climbing down is climbing faster than the person climbing above him.", "chatgpt-answer": "A. Climbing faster than the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing down. The man climbing down is seen climbing faster than the man climbing above him.", "gt-answer": "C. Climbing at the same speed as the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person climbing down is climbing faster than the person climbing above him.", "chatgpt-answer": "B. Climbing slower than the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing down. The man climbing down is seen climbing faster than the man climbing above him.", "gt-answer": "C. Climbing at the same speed as the person below", "rating": 0 } ] }, "1059462749_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the man climbing the ladder is seen climbing slower than the man climbing the stairs.", "chatgpt-answer": "A. Climbing slower than the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing up the stairs. The man climbing the ladder is seen climbing slower than the man climbing the stairs.", "gt-answer": "A. Climbing slower than the person below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man climbing the ladder is seen climbing slower than the man climbing the staircase.", "chatgpt-answer": "A. Climbing slower than the person below", "video-llm-prediction": "The video shows a man climbing a ladder while another man is climbing a staircase. The man climbing the ladder is seen climbing slower than the man climbing the staircase. The video captures the man climbing the ladder from different angles, and the man climbing the staircase is also seen from different angles. The video ends with the man climbing the ladder from the top.", "gt-answer": "A. Climbing slower than the person below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man in the foreground is climbing slower than the man in the background.", "chatgpt-answer": "A. Climbing slower than the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing a ladder in the background. The man in the foreground is climbing slower than the man in the background.", "gt-answer": "A. Climbing slower than the person below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the person climbing slower is above the person climbing faster.", "chatgpt-answer": "A. Climbing slower than the person below", "video-llm-prediction": "A man is seen climbing a ladder slowly while another man climbs it faster. The man climbing slower is above the man climbing faster.", "gt-answer": "A. Climbing slower than the person below", "rating": 1 } ] }, "1059462749_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the man climbing the ladder is climbing at the same speed as the man climbing the staircase.", "chatgpt-answer": "A. Climbing at the same speed as the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing a staircase. The man climbing the ladder is climbing at the same speed as the man climbing the staircase.", "gt-answer": "B. Climbing faster than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person climbing the ladder is seen climbing at the same speed as the person climbing the staircase.", "chatgpt-answer": "A. Climbing at the same speed as the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing a staircase. The man climbing the ladder is seen climbing at the same speed as the man climbing the staircase.", "gt-answer": "B. Climbing faster than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man in the foreground is climbing at the same speed as the man in the background. This means that both individuals are climbing at an equal pace.", "chatgpt-answer": "A. Climbing at the same speed as the person below", "video-llm-prediction": "A man is seen climbing a ladder while another man is climbing a ladder in the background. The man in the foreground is climbing at the same speed as the man in the background.", "gt-answer": "B. Climbing faster than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man in the foreground climbs at the same speed as the man in the background. Therefore, the correct answer is:", "chatgpt-answer": "A. Climbing at the same speed as the person below", "video-llm-prediction": "A man climbs a set of stairs while another man climbs a ladder in the background. The man in the foreground climbs at the same speed as the man in the background.", "gt-answer": "B. Climbing faster than the person below", "rating": 0 } ] }, "1059072773_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the ice cream is melting at different speeds, with one piece melting faster than the other.", "chatgpt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink background. The ice cream is shown melting at different speeds, with one piece melting faster than the other. The video also includes a piece of information that is not consistent with the video.", "gt-answer": "A. melting at the same speed as the ice cream below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the first scene displays the ice cream melting at the same speed as the ice cream below, meaning that the ice cream above is also melting at the same speed as the ice cream below.", "chatgpt-answer": "A. melting at the same speed as the ice cream below", "video-llm-prediction": "The video showcases the melting of ice cream in various ways. The first scene displays the ice cream melting at the same speed as the ice cream below. The second scene shows the ice cream melting faster than the ice cream below. Lastly, the third scene shows the ice cream melting slower than the ice cream below. The video highlights the different speeds at which ice cream melts, providing a visual representation of the process.", "gt-answer": "A. melting at the same speed as the ice cream below", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically mentions that one piece of ice cream is melting faster than the other. This implies that the speed of the ice cream above is different from the ice cream below.", "chatgpt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is seen melting at different speeds, with one piece melting faster than the other. The video also shows the ice cream dripping down in different shapes, including a cone and a swirl.", "gt-answer": "A. melting at the same speed as the ice cream below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the ice cream on the left melts faster than the ice cream on the right, and the ice cream on the right melts slower than the ice cream on the left.", "chatgpt-answer": "C. melting slower than the ice cream below", "video-llm-prediction": "The video showcases the melting of ice cream at different speeds. The ice cream on the left melts faster than the ice cream on the right. The ice cream on the right melts slower than the ice cream on the left.", "gt-answer": "A. melting at the same speed as the ice cream below", "rating": 0 } ] }, "1059072773_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description mentions that one piece of ice cream is melting slower than the others. That means the speed of the ice cream above is different from the speed of the ice cream below.", "chatgpt-answer": "A. melting slower than the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is seen melting at different speeds, with one piece melting slower than the others. The video also shows the ice cream melting in a liquid form.", "gt-answer": "A. melting slower than the ice cream below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ice cream is melting at different speeds, with some melting faster than others. This implies that there is a variation in the speed of melting between different parts of the ice cream.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the melting of ice cream on a pink background. The ice cream is seen melting at different speeds, with some melting faster than others. The video also highlights the contrast between the ice cream and the pink background.", "gt-answer": "A. melting slower than the ice cream below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the ice cream is melting at different speeds, with one piece melting faster than the other. Therefore, the ice cream above is melting Faster than the ice cream below.", "chatgpt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is seen melting at different speeds, with one piece melting faster than the other. The video also shows the ice cream melting in a liquid form.", "gt-answer": "A. melting slower than the ice cream below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the ice cream is melting at different speeds, with one piece melting slower than the other. Therefore, we can conclude that the speed of the ice cream above is melting slower than the ice cream below.", "chatgpt-answer": "A. melting slower than the ice cream below", "video-llm-prediction": "The video showcases the melting of ice cream on a pink surface. The ice cream is seen melting at different speeds, with one piece melting slower than the other. The video provides a close-up view of the ice cream melting, highlighting the different speeds at which it is melting. The video emphasizes the contrast between the ice cream that is melting faster and the ice cream that is melting slower. Overall, the video provides a visually appealing and informative demonstration of the melting process of ice cream.", "gt-answer": "A. melting slower than the ice cream below", "rating": 1 } ] }, "1059072773_concat_2": { "speed": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that the ice cream is shown melting at different speeds with one piece melting faster than the other. This indicates that the speed of the ice cream above is different from the speed of the ice cream below.", "chatgpt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is shown melting at different speeds, with one piece melting faster than the other. The video also includes a piece of information that is not consistent with the video.", "gt-answer": "B. melting faster than the ice cream below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ice cream is seen melting at different speeds, with one piece melting faster than the other. Therefore, the correct answer is B. melting faster than the ice cream below.", "chatgpt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is seen melting at different speeds, with one piece melting faster than the other. The video also shows the ice cream dripping down in different patterns.", "gt-answer": "B. melting faster than the ice cream below", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the ice cream is melting at the same speed as the ice cream below.", "chatgpt-answer": "A. melting at the same speed as the ice cream below", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface. The ice cream is melting at the same speed as the ice cream below.", "gt-answer": "B. melting faster than the ice cream below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the ice cream melts at different speeds, with one piece melting faster than the other. This means that the speed of the ice cream above is melting faster than the ice cream below.", "chatgpt-answer": "B. melting faster than the ice cream below", "video-llm-prediction": "The video showcases the melting of ice cream on a pink surface. The ice cream melts at different speeds, with one piece melting faster than the other. The video provides a close-up view of the ice cream melting, highlighting the different melting speeds.", "gt-answer": "B. melting faster than the ice cream below", "rating": 1 } ] }, "1090578917_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the man is seen performing the moves in slow motion. Therefore, the man is jumping at a slower speed than the man below.", "chatgpt-answer": "B. Slower than the man below", "video-llm-prediction": "The video shows a man performing a series of soccer moves, including dribbling, passing, and shooting. The man is seen running towards the goal and attempting to score. The video also shows the man falling down and getting back up. The man is wearing a soccer uniform and is surrounded by a crowd of people. The video is shot in a stadium with a large screen in the background. The man is seen performing the moves in slow motion, and the video is shot in high definition. The video ends with the man scoring a goal.", "gt-answer": "A. Jumping at the same speed as the man below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is performing a jump and a slide. It does not provide any information about another person below or their speed. Therefore, there is not enough information to answer the question.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man performing a series of soccer moves, including a jump and a slide. The man is seen wearing an orange shirt and black shorts, and he is surrounded by a large crowd. The video is shot in a stadium at night, and the man is seen performing the moves in front of a goal. The video ends with the man walking away from the goal.", "gt-answer": "A. Jumping at the same speed as the man below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man in the orange shirt is seen jumping at the same speed as another man in the same orange shirt, and also jumping at a slower speed than another man in an orange shirt. This implies that the man above is jumping at a slower speed than the man below.", "chatgpt-answer": "B. Slower than the man below", "video-llm-prediction": "A man in an orange shirt is seen jumping in front of a goal. He is seen jumping at the same speed as another man in the same orange shirt. The man in the orange shirt is also seen jumping in front of the goal at a slower speed than another man in an orange shirt.", "gt-answer": "A. Jumping at the same speed as the man below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man above jumps at the same speed as the man below, while also mentioning that the man above is slower than the man below. This means that the man above is jumping at a speed that is slower than the man below.", "chatgpt-answer": "B. Slower than the man below", "video-llm-prediction": "The man above jumps at the same speed as the man below, while the man above is slower than the man below.", "gt-answer": "A. Jumping at the same speed as the man below", "rating": 0 } ] }, "1090578917_concat_1": { "speed": [ { "chatgpt-reasoning": "Based on the video description, it states that the man in an orange shirt is jumping at the same speed as another man in an orange shirt who is also jumping in front of the goal. Therefore, the correct answer is:", "chatgpt-answer": "A. Jumping at the same speed as the man below", "video-llm-prediction": "A man in an orange shirt is seen jumping in front of a goal. He is seen jumping at the same speed as another man in an orange shirt who is also jumping in front of the goal. The man in the orange shirt is seen jumping slower than the man in the orange shirt who is jumping in front of the goal. The man in the orange shirt is also seen jumping faster than the man in the orange shirt who is jumping in front of the goal.", "gt-answer": "B. Slower than the man below", "rating": 0 }, { "chatgpt-reasoning": "The video describes that the man's jump is captured in slow motion, indicating that he is jumping slower than normal speed.", "chatgpt-answer": "B. Slower than the man below", "video-llm-prediction": "The video showcases a man performing a soccer move where he jumps and kicks the ball over another player. The man's jump is captured in slow motion, and the video also shows the man falling down on the field. The video is set in a soccer field with a crowd of people watching the game.", "gt-answer": "B. Slower than the man below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is performing a soccer move in front of a goal and then falls down onto the ground. There is no mention or indication of another person in the description, so we cannot compare the man's speed to another person.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man in an orange shirt is seen performing a soccer move in front of a goal. He then falls down onto the ground.", "gt-answer": "B. Slower than the man below", "rating": 0 }, { "chatgpt-reasoning": "According to the video description, the man above jumps at the same speed as the man below, but is slower than the man below. Therefore, the man above is jumping at a slower speed than the man below.", "chatgpt-answer": "B. Slower than the man below", "video-llm-prediction": "The man above jumps at the same speed as the man below, while the man above is slower than the man below.", "gt-answer": "B. Slower than the man below", "rating": 1 } ] }, "1090578917_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the man above and the man below are performing the same move, running towards the goal and then jumping to hit the ball. There is no indication in the description about the speed at which they are jumping.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man performing a soccer move on the field. He is seen running towards the goal and then jumping to hit the ball. The man is wearing an orange shirt and black shorts. The video also shows a man in a yellow shirt and black shorts performing the same move. The man in the yellow shirt is seen running towards the goal and then jumping to hit the ball. The video also shows a man in an orange shirt and black shorts performing the same move. The man in the orange shirt is seen running towards the goal and then jumping to hit the ball.", "gt-answer": "B. Faster than the man below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is performing a series of soccer moves, including a bicycle kick and a flip. Since the question asks about the speed of the man in the video while he is jumping, there is no information given in the video description that indicates whether the speed of the man jumping is faster, slower, or the same as the man below. Therefore, it is not possible to determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a man performing a series of soccer moves, including a bicycle kick and a flip. The man is seen wearing an orange shirt and black shorts, and the video is set in a stadium with a large crowd watching. The video starts with the man performing a bicycle kick, followed by a flip. The man then lays on the ground and performs a series of other soccer moves. The video ends with the man standing up and walking away.", "gt-answer": "B. Faster than the man below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man in the orange shirt is seen performing the move faster than another man in an orange shirt who is also performing the same move.", "chatgpt-answer": "B. Faster than the man below", "video-llm-prediction": "A man in an orange shirt is seen performing a soccer move in front of a goal. He jumps at the same speed as another man in an orange shirt who is also performing the same move. The man in the orange shirt is seen performing the move faster than another man in an orange shirt who is also performing the same move.", "gt-answer": "B. Faster than the man below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man above jumps at the same speed as the man below, while also mentioning that the man above is faster than the man below. Therefore, the man above cannot be jumping at the same speed as the man below or be slower than the man below. The only logical answer is that the man above is jumping faster than the man below.", "chatgpt-answer": "B. Faster than the man below", "video-llm-prediction": "The man above jumps at the same speed as the man below, while the man above is faster than the man below.", "gt-answer": "B. Faster than the man below", "rating": 1 } ] }, "1075338140_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the ball above is moving faster than the ball below.", "chatgpt-answer": "A. faster than the ball below", "video-llm-prediction": "The video shows a ball rolling on a surface, and the camera captures the ball from different angles. The video also includes a piece of information that the ball is moving faster than the ball below.", "gt-answer": "C. moving at the same speed as the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the ball above is moving slower than the ball below.", "chatgpt-answer": "B. slower than the ball below", "video-llm-prediction": "The video showcases a ball's movement on a blue background. The ball is seen moving at different speeds, including faster than the ball below and slower than the ball above. The video captures the ball's movement in detail, providing a mesmerizing visual experience.", "gt-answer": "C. moving at the same speed as the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the speed of the ball above is faster than the ball below.", "chatgpt-answer": "A. faster than the ball below", "video-llm-prediction": "The video shows a ball moving on a pink surface, and the speed of the ball is faster than the ball below. The video also shows a ball moving on a blue surface, and the speed of the ball is slower than the ball above.", "gt-answer": "C. moving at the same speed as the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the ball's speed is varying. Therefore, we cannot determine whether the ball is faster, slower, or moving at the same speed as the ball below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a ball's movement on a blue surface, with the ball's speed varying. The ball's movement is captured from different angles, and the video provides a detailed view of the ball's movement.", "gt-answer": "C. moving at the same speed as the ball below", "rating": 0 } ] }, "1075338140_concat_1": { "speed": [ { "chatgpt-reasoning": "From the video description, it is stated that the ball is initially moving faster than the surface, then at the same speed as the surface, and finally slower than the surface. Therefore, the speed of the ball above is slower than the ball below.", "chatgpt-answer": "C. slower than the ball below", "video-llm-prediction": "The video showcases a ball moving on a pink surface, with the ball moving faster than the surface. The video also features a close-up shot of the ball, which is moving at the same speed as the surface. The video ends with the ball moving slower than the surface.", "gt-answer": "C. slower than the ball below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ball is seen rolling faster than another ball, and later it is seen rolling slower than the other ball.", "chatgpt-answer": "A. faster than the ball below", "video-llm-prediction": "The video showcases a ball rolling on a surface, with the camera capturing its movement from different angles. The ball is seen rolling faster than another ball, and the camera captures the movement of both balls. The video also features a close-up shot of the ball, highlighting its texture and reflecting the light. The video ends with the ball rolling slower than the other ball, and the camera captures the movement of both balls.", "gt-answer": "C. slower than the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the ball moves at different speeds. However, it does not provide any information about another ball for comparison. Therefore, we cannot determine the speed of the ball relative to another ball.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video showcasing a ball rolling on a surface with a pink background. The ball moves at different speeds, and the background changes from blue to pink.", "gt-answer": "C. slower than the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the ball is seen moving at different speeds, with one instance showing it moving faster than the other.", "chatgpt-answer": "A. faster than the ball below", "video-llm-prediction": "A video showcasing a ball's movement on a pink surface is presented. The ball is seen moving at different speeds, with one instance showing it moving faster than the other. The video also features a close-up shot of the ball, highlighting its movement and texture.", "gt-answer": "C. slower than the ball below", "rating": 0 } ] }, "1075338140_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the ball is moving at different speeds. However, there is no mention or comparison of the speed of the ball above and below. Therefore, we cannot determine the speed of the ball above based on the provided information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a ball moving on a blue surface, and the camera captures the ball from different angles. The ball is seen moving at different speeds, and the camera captures the ball from different angles. The video ends with the ball still moving on the surface.", "gt-answer": "B. faster than the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the ball's speed varies throughout the video, from slow to fast. There is no mention of any other ball in the video description to compare the speed with.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a ball's movement on a blue surface, with the ball's speed varying throughout the video. The ball's movement is captured from different angles, providing a comprehensive view of its movement. The video highlights the ball's movement on the surface, with the ball's speed varying from slow to fast. The video's focus is on the ball's movement, and the viewer can appreciate the ball's movement from different angles. The video's overall message is to showcase the ball's movement on the surface, with the ball's speed varying throughout the video.", "gt-answer": "B. faster than the ball below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the ball is shown moving faster than the surface. This implies that the speed of the ball above is faster than the speed of the ball below.", "chatgpt-answer": "B. faster than the ball below", "video-llm-prediction": "The video shows a ball moving on a pink surface, and the camera zooms in on the ball. The ball is then shown moving faster than the surface.", "gt-answer": "B. faster than the ball below", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically states that the ball above is moving faster than the ball below.", "chatgpt-answer": "B. faster than the ball below", "video-llm-prediction": "The video showcases a ball moving on a blue surface, with the ball above moving faster than the ball below. The video captures the ball's movement in a mesmerizing way, with the ball's reflection adding to the visual appeal. The video's focus is solely on the ball's movement, with no other objects or elements present in the frame. The video's simplicity and elegance make it an excellent example of a minimalist video.", "gt-answer": "B. faster than the ball below", "rating": 1 } ] }, "1077575504_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the pile of salt above is growing at a faster speed than the pile of salt below.", "chatgpt-answer": "B. growing at a faster speed than the pile of salt below", "video-llm-prediction": "The video shows a pile of salt growing at a faster speed than the pile of salt below. The salt is being poured into a wooden bowl, and the pile of salt is growing at a faster speed than the pile of salt below. The video is a demonstration of the growth of salt.", "gt-answer": "A. growing at the same speed as the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the salt pile is growing at a steady pace. This implies that the speed of the pile of salt above is consistent with the speed of the pile of salt below.", "chatgpt-answer": "A. growing at the same speed as the pile of salt below", "video-llm-prediction": "The video showcases the process of salt being poured into a container, with the salt gradually filling up the container. The video starts with a close-up shot of the salt being poured, and as the video progresses, the salt gradually fills up the container. The video highlights the gradual increase in the amount of salt, with the salt pile growing at a steady pace. The video provides a visual representation of the process of salt being poured into a container, with the salt gradually filling up the container. The video is a great example of the process of salt being poured into a container, with the salt", "gt-answer": "A. growing at the same speed as the pile of salt below", "rating": 1 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the pile of salt. It only describes the pouring of salt into a bowl and then pouring it out. Therefore, there is not enough information to determine the speed of the pile of salt.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of salt being poured into a bowl and then being poured out of the bowl. The salt is shown in a close-up shot, and the video ends with the salt being poured out of the bowl.", "gt-answer": "A. growing at the same speed as the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the pile of salt above is seen growing at a slower speed than the pile of salt below.", "chatgpt-answer": "C. growing at a slower speed than the pile of salt below", "video-llm-prediction": "A pile of salt is shown, and it is seen growing at a slower speed than the pile of salt below. The video showcases the process of salt being poured into a wooden bowl, and the salt is seen growing at a faster speed than the pile of salt below.", "gt-answer": "A. growing at the same speed as the pile of salt below", "rating": 0 } ] }, "1077575504_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description states that initially, the salt pile above is growing at a faster speed than the pile of salt below. Then, it is mentioned that the salt pile above is growing at a slower speed than the pile of salt below. Finally, it is stated that the salt pile above is growing at the same speed as the pile of salt below.", "chatgpt-answer": "C. growing at the same speed as the pile of salt below", "video-llm-prediction": "The video shows a pile of salt growing at a faster speed than the pile of salt below it. The salt is being poured into a wooden bowl, and the video captures the process of the salt pile growing. The video also shows the salt pile growing at a slower speed than the pile of salt below it. The video ends with the salt pile growing at the same speed as the pile of salt below it.", "gt-answer": "B. growing at a slower speed than the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the salt is gradually filling the bowl. This implies that the speed of the pile of salt above is the same as the pile of salt below since they are both filling up at a gradual pace.", "chatgpt-answer": "C. growing at the same speed as the pile of salt below", "video-llm-prediction": "The video showcases the process of salt being poured into a wooden bowl, with the salt gradually filling the bowl. The video also features a close-up shot of the salt in the bowl, highlighting its texture and appearance. The video emphasizes the gradual filling of the bowl with salt, creating a visually captivating scene.", "gt-answer": "B. growing at a slower speed than the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the pile of salt above is growing at a faster speed than the pile of salt below.", "chatgpt-answer": "A. growing at a faster speed than the pile of salt below", "video-llm-prediction": "A video shows a pile of salt growing at a faster speed than the pile of salt below.", "gt-answer": "B. growing at a slower speed than the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there are two piles of salt being poured into the wooden bowl, and they are growing at different speeds. It specifically states that \"one pile of salt is growing faster than the other\". Therefore, the correct answer is A. growing at a faster speed than the pile of salt below.", "chatgpt-answer": "A. growing at a faster speed than the pile of salt below", "video-llm-prediction": "The video showcases the process of salt being poured into a wooden bowl, with the salt gradually filling the bowl. The video highlights the different speeds at which the salt is being poured, with one pile of salt growing faster than the other. The video emphasizes the visual impact of the salt being poured into the bowl, with the sound of the pouring salt adding to the overall sensory experience. The video is a simple yet effective demonstration of the process of pouring salt into a bowl, and the different speeds at which the salt is being poured add an element of intr", "gt-answer": "B. growing at a slower speed than the pile of salt below", "rating": 0 } ] }, "1077575504_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the pile of salt above is growing at a faster speed than the pile of salt below it. It specifically mentions that both piles are growing at the same speed.", "chatgpt-answer": "A. growing at the same speed as the pile of salt below", "video-llm-prediction": "The video shows a pile of salt growing at a faster speed than the pile of salt below it. The salt is being poured into a bowl, and the pile of salt is growing at the same speed as the pile of salt below it.", "gt-answer": "C. growing at a faster speed than the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the salt is gradually filling up the container. This indicates that the speed of the pile of salt above is growing at the same speed as the pile of salt below.", "chatgpt-answer": "A. growing at the same speed as the pile of salt below", "video-llm-prediction": "The video showcases the process of salt being poured into a container, with the salt gradually filling up the container. The video begins with a close-up shot of the salt being poured into the container, and as the video progresses, the salt gradually fills up the container. The video highlights the gradual filling of the container with salt, emphasizing the process of salt being poured into the container. The video provides a visual representation of the process of salt being poured into a container, with the salt gradually filling up the container.", "gt-answer": "C. growing at a faster speed than the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the salt is poured at a consistent speed and the camera pans out to show the entire process. This indicates that the speed of the pile of salt above is the same as the pile of salt below because both are being poured at the same consistent speed.", "chatgpt-answer": "A. growing at the same speed as the pile of salt below", "video-llm-prediction": "A video showcasing the process of salt being poured into a container. The video starts with a close-up shot of salt being poured into a container, and then the camera pans out to show the entire process. The salt is poured at a consistent speed, and the video ends with the container being filled with salt.", "gt-answer": "C. growing at a faster speed than the pile of salt below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the pile of salt above is growing at the same speed as the pile of salt below it.", "chatgpt-answer": "A. growing at the same speed as the pile of salt below", "video-llm-prediction": "The video shows a pile of salt growing at a faster speed than the pile of salt below it. The salt is being poured into a bowl, and the pile of salt is growing at the same speed as the pile of salt above it.", "gt-answer": "C. growing at a faster speed than the pile of salt below", "rating": 0 } ] }, "1100319395_concat_0": { "speed": [ { "chatgpt-reasoning": "According to the video description, the white circle above rotates faster than the white circle below it.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "The video features a white circle that rotates faster than a white circle below it. The white circle above rotates at the same speed as the white circle below it. The video also includes a white circle that rotates slower than the white circle below it.", "gt-answer": "C. rotating at the same speed as the white circle below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white circle above rotates faster than the white circle below it.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "The video features a white circle that rotates faster than a white circle below it. The white circle above rotates at the same speed as the white circle below it. The video also includes a white circle that rotates slower than the white circle above it.", "gt-answer": "C. rotating at the same speed as the white circle below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white circle above is spinning faster than the white circle below.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "The video shows a white circle spinning faster than another white circle.", "gt-answer": "C. rotating at the same speed as the white circle below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the white circle above rotates faster than the white circle below it.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "The video features a white circle that rotates faster than another white circle below it. The video also includes a white circle that rotates at the same speed as the circle below it.", "gt-answer": "C. rotating at the same speed as the white circle below", "rating": 0 } ] }, "1100319395_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the white circle above is spinning slower than the circle below it.", "chatgpt-answer": "C. slower than the white circle below", "video-llm-prediction": "The video shows a white circle spinning faster than a white circle below it. The white circle above it is also spinning at the same speed as the circle below it. The white circle above it is spinning slower than the circle below it.", "gt-answer": "A. faster than the white circle below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white circle above rotates faster than the white circle below it.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "The video features a white circle that rotates faster than a white circle below it. The video also includes a white circle that rotates at the same speed as the white circle below it. Additionally, there is a white circle that rotates slower than the white circle below it.", "gt-answer": "A. faster than the white circle below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the white circle above is spinning faster than another white circle. Therefore, the correct answer is A. faster than the white circle below.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "A white circle is shown spinning faster than another white circle.", "gt-answer": "A. faster than the white circle below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the white circle above rotates faster than the white circle below it.", "chatgpt-answer": "A. faster than the white circle below", "video-llm-prediction": "The video features a white circle that rotates faster than another white circle below it. The video also includes a white circle that rotates at the same speed as the circle below it. Additionally, there is a white circle that rotates slower than the circle below it.", "gt-answer": "A. faster than the white circle below", "rating": 1 } ] }, "1100319395_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the white circle above is rotating at the same speed as the white circle below.", "chatgpt-answer": "B. rotating at the same speed as the white circle below", "video-llm-prediction": "The video shows a white circle spinning faster than a white circle above it. The white circle above is rotating at the same speed as the white circle below.", "gt-answer": "A. slower than the white circle below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white circle above rotates at a different speed than the white circle below. It does not specify whether it is faster or slower, so it is unclear whether option A or C is correct. However, since the video ends with a white circle that rotates at a faster speed than the white circle above it, it can be inferred that the white circle above is rotating at a slower speed.", "chatgpt-answer": "A. slower than the white circle below", "video-llm-prediction": "The video features a white circle that rotates at different speeds, with a smaller white circle appearing above it. The video also includes a white circle with a black dot in the middle, which rotates at a slower speed than the white circle above it. The video ends with a white circle that rotates at a faster speed than the white circle above it.", "gt-answer": "A. slower than the white circle below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the white circle above is rotating at a slower speed than the white circle below it.", "chatgpt-answer": "A. slower than the white circle below", "video-llm-prediction": "A white circle rotates at a slower speed than a white circle below it.", "gt-answer": "A. slower than the white circle below", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the white circle above rotates at a slower speed than another white circle.", "chatgpt-answer": "A. slower than the white circle below", "video-llm-prediction": "The video features a white circle that rotates at a slower speed than another white circle. The video also includes a white circle that rotates at the same speed as the other white circle.", "gt-answer": "A. slower than the white circle below", "rating": 1 } ] }, "1086820415_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description mentions that some waves are appearing to move faster than others. This suggests that the speed of the wave above is moving faster than the wave below.", "chatgpt-answer": "B. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean and the power of its waves. The camera captures the movement of the waves, with some appearing to move faster than others. The waves are shown in various positions, with some crashing and others still moving. The video also includes a shot of a person surfing on the waves. Overall, the video provides a captivating view of the ocean and its waves.", "gt-answer": "A. Moving at the same speed as the wave below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that some waves are shown in various positions, with some crashing and others still in motion. Therefore, it can be inferred that the waves depicted in the video have different speeds.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the beauty of the ocean and the power of its waves. The camera captures the movement of the waves, with some appearing to move faster than others. The waves are shown in various positions, with some crashing and others still in motion. The video also features a close-up shot of a wave crashing, highlighting the power and force of the ocean. Overall, the video provides a mesmerizing view of the ocean and its waves, leaving the viewer in awe of the natural beauty.", "gt-answer": "A. Moving at the same speed as the wave below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the wave above is moving at the same speed as the wave below.", "chatgpt-answer": "A. Moving at the same speed as the wave below", "video-llm-prediction": "A large wave is seen crashing into the water, with the water splashing up and creating a beautiful display. The wave is moving at the same speed as the wave below it.", "gt-answer": "A. Moving at the same speed as the wave below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the waves are seen moving at different speeds, with some moving faster than others. Therefore, the speed of the wave above is moving faster than the wave below.", "chatgpt-answer": "B. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean with waves crashing against the water. The waves are seen moving at different speeds, with some moving faster than others. The video captures the power and beauty of the ocean, with the waves crashing against the water and creating a stunning visual display.", "gt-answer": "A. Moving at the same speed as the wave below", "rating": 0 } ] }, "1086820415_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description mentions that \"the camera captures the movement of the waves, with some appearing to move faster than others.\" This indicates that the wave above is moving faster than the wave below.", "chatgpt-answer": "A. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean and the power of its waves. The camera captures the movement of the waves, with some appearing to move faster than others. The waves crash against the water, creating a mesmerizing display of white foam. The camera also captures the movement of the waves from above, providing a unique perspective of the ocean's power. The video highlights the beauty of the ocean and the power of its waves, making it a must-see for anyone who appreciates the natural world.", "gt-answer": "A. Moving faster than the wave below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that \"some waves appear to move faster than others\". This indicates that the speed of the wave above is different from the wave below.", "chatgpt-answer": "A. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean and the power of its waves. The camera captures the movement of the waves, with some appearing to move faster than others. The waves are shown crashing against the water, creating a stunning display of nature's power. The video also highlights the contrast between the calmness of the water and the intensity of the waves. Overall, the video is a captivating tribute to the beauty of the ocean and the power of its waves.", "gt-answer": "A. Moving faster than the wave below", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically states that the wave above is moving faster than the wave below.", "chatgpt-answer": "A. Moving faster than the wave below", "video-llm-prediction": "The video shows a large wave crashing into the water, with the wave above moving faster than the wave below.", "gt-answer": "A. Moving faster than the wave below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the waves are seen moving at different speeds, with some moving faster than others. Therefore, the wave above must be moving faster than the wave below.", "chatgpt-answer": "A. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean with waves crashing and foam splashing. The waves are seen moving at different speeds, with some moving faster than others. The video captures the power and beauty of the ocean, with the waves crashing and creating a stunning display of nature.", "gt-answer": "A. Moving faster than the wave below", "rating": 1 } ] }, "1086820415_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description mentions that \"some waves appearing to move faster than others.\" This indicates that the speed of the wave above is faster than the wave below.", "chatgpt-answer": "C. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean and the power of its waves. The camera captures the movement of the waves, with some appearing to move faster than others. The waves are shown in various positions, from crashing against the shore to rolling in the open water. The video also highlights the power of the ocean, with a large wave crashing in the distance. Overall, the video provides a mesmerizing view of the ocean and its waves.", "gt-answer": "B. Moving slower than the wave below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"the waves are seen moving at different speeds, with some moving faster than others.\" Therefore, the speed of the wave above is moving faster than the wave below.", "chatgpt-answer": "C. Moving faster than the wave below.", "video-llm-prediction": "The video showcases the beauty of the ocean with its waves crashing and foaming. The waves are seen moving at different speeds, with some moving faster than others. The waves are also seen moving in different directions, with some moving upwards and others moving downwards. The video captures the power and beauty of the ocean, with its waves crashing and foaming. The waves are seen moving at different speeds, with some moving faster than others. The waves are also seen moving in different directions, with some moving upwards and others moving downwards. The video provides a mesmerizing view of the ocean and its", "gt-answer": "B. Moving slower than the wave below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that \"The wave above is moving slower than the wave below.\"", "chatgpt-answer": "B. Moving slower than the wave below", "video-llm-prediction": "The video shows a large wave crashing into the water, with the wave above moving at the same speed as the wave below. The wave above is moving slower than the wave below. The video captures the beauty and power of the ocean in motion.", "gt-answer": "B. Moving slower than the wave below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the waves are moving at different speeds, with some moving faster than others. Therefore, the speed of the wave above is moving faster than the wave below.", "chatgpt-answer": "C. Moving faster than the wave below", "video-llm-prediction": "The video showcases the beauty of the ocean with its waves crashing and creating a mesmerizing sight. The waves are seen moving at different speeds, with some moving faster than others. The video captures the movement of the waves from different angles, providing a comprehensive view of the ocean's power and beauty.", "gt-answer": "B. Moving slower than the wave below", "rating": 0 } ] }, "1096238125_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the man and the woman are lifting weights and then setting them down. However, it does not provide any information about the speed at which they are performing this action. Therefore, we cannot determine the speed of the two people above lifting the kettlebell based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman kneeling on a blue mat. The woman is holding a kettlebell while the man is holding a dumbbell. They are both lifting the weights and then setting them down. The video is consistent with the information that the woman is holding a kettlebell while the man is holding a dumbbell.", "gt-answer": "C. at the same speed as the two people below", "rating": 0 }, { "chatgpt-reasoning": "The speed at which the two people are lifting the kettlebell is not mentioned in the video description. Therefore, we cannot determine the speed of the two people based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman kneeling on the floor, with the woman holding a kettlebell. They are demonstrating how to do a proper squat with the kettlebell. The video is a tutorial on how to do a proper squat with a kettlebell. The woman in the video is wearing a grey tank top and black shorts, while the man is wearing a white t-shirt and black shorts. The video is shot in a gym with a weight rack in the background. The video is a great resource for anyone looking to improve their squat technique", "gt-answer": "C. at the same speed as the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the two people start lifting weights and then kneeling back down. However, it doesn't provide any information about the speed at which they are lifting the kettlebell. Therefore, there is not enough information to answer the question.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two people are seen kneeling on the floor, and they start lifting weights. The video shows them lifting weights and then kneeling back down.", "gt-answer": "C. at the same speed as the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed at which the two people are lifting the kettlebell. There is no information provided to determine whether they are lifting it slower, faster, or at the same speed as the two people below.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows two people kneeling on a blue mat, with one person holding a kettlebell. The other person is standing in front of them, and they are both speaking to the camera. The video then shows the two people standing in front of the camera, with the person holding the kettlebell now standing behind them. The video ends with the two people kneeling on the mat again.", "gt-answer": "C. at the same speed as the two people below", "rating": 0 } ] }, "1096238125_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed at which the two people are lifting the kettlebell. Therefore, we cannot determine the speed based on the given description.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a man and a woman kneeling on the floor, with the woman holding a kettlebell. The man is instructing the woman on how to lift the kettlebell, and she follows his instructions. The video emphasizes the importance of proper form and technique when lifting weights.", "gt-answer": "C. faster than the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed at which the two people are lifting the kettlebell. It only mentions that they are performing a specific exercise routine and provides a clear demonstration of the proper technique for performing it. Therefore, there is not enough information to determine the speed at which the two people are lifting the kettlebell.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows two people kneeling on the floor, with one person holding a weight and the other person holding a dumbbell. The person holding the weight lifts it up and then down again, while the other person also lifts their dumbbell up and down. The video seems to be focused on weightlifting exercises, with a particular emphasis on the use of dumbbells. The two people in the video are likely working on their strength and fitness, as they are performing a specific exercise routine. Overall, the video provides a clear demonstration of the proper technique for performing this", "gt-answer": "C. faster than the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description provides information about two people lifting a weight. However, it does not mention anything about the speed at which they are lifting the kettlebell or any comparison with other individuals. Therefore, there is not enough information to determine the speed of the two people above compared to the two people below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two people are seen kneeling on the floor, and one of them is holding a weight. They are both moving their arms around while the other person is holding onto the weight. The video seems to be focused on weightlifting and exercise.", "gt-answer": "C. faster than the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the two people above lifting the kettlebell compared to the two people below. Therefore, it is not possible to determine the speed based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows two people kneeling on a blue mat, with one person holding a weight. The other person is standing in front of them, and they are all moving their arms around. The video seems to be focused on strength training and proper form. The two people above are likely demonstrating a specific exercise or movement, while the two people below are following along and learning from their technique. Overall, the video is a helpful resource for anyone looking to improve their strength training routine.", "gt-answer": "C. faster than the two people below", "rating": 0 } ] }, "1096238125_concat_2": { "speed": [ { "chatgpt-reasoning": "Based on the video description, it is not mentioned that there are two people below lifting kettlebells, so we cannot determine the speed of the two people above compared to the two people below. Therefore, none of the choices are correct.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video shows a man and a woman performing a workout routine in a gym. The woman is seen kneeling down and lifting a weight while the man is standing next to her. The video also includes a collage of images of the two people performing the workout.", "gt-answer": "B. slower than the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man and woman are lifting weights up and down, indicating that they are performing repetitions of a weightlifting exercise. However, there is no mention or comparison to any other individuals in the video, so we cannot determine their speed relative to anyone else.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman performing a weightlifting exercise in a gym. The woman is kneeling down while the man is standing behind her. They are both holding weights and lifting them up and down. The video captures the intense physical activity and the focus on the weights.", "gt-answer": "B. slower than the two people below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that two people are working out, with one person holding a weight. However, there is no mention of any comparison or relation to the \"two people below\" in the description. Therefore, it is not possible to determine the speed of the two people above lifting the kettlebell.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two people are seen kneeling on a mat, with one person holding a weight. The other person is seen standing in front of them, and they all seem to be working out.", "gt-answer": "B. slower than the two people below", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, it is mentioned that the two people are seen standing and talking to each other while holding weights, which implies that they are lifting kettlebells. However, there is no information provided about any other people below or their speed. Therefore, we cannot determine the speed of the two people above compared to the two people below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "Two people are seen kneeling on a mat, and they start lifting weights. The video shows them performing various exercises, including squats and lifting weights. The two people are seen standing and talking to each other while holding weights. The video ends with the two people kneeling on the mat.", "gt-answer": "B. slower than the two people below", "rating": 0 } ] }, "1056433484_concat_0": { "speed": [ { "chatgpt-reasoning": "Based on the video description, it mentions that the Earth is spinning in space. Since the Earth rotates on its axis, the speed of the Earth above should be the same as the Earth below.", "chatgpt-answer": "B. rotates at the same speed as the earth below", "video-llm-prediction": "The video shows the Earth spinning in space, with the sun and moon visible in the background. The video also includes a shot of a solar eclipse.", "gt-answer": "B. rotates at the same speed as the earth below", "rating": 1 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the earth above. The video only describes the movement of a yellow ball on various screens. Therefore, we cannot determine the speed of the earth above based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a black and white screen with a yellow ball moving from the left to the right side of the screen. The screen then changes to a black background with a yellow ball moving from the left to the right side of the screen. The video then shows a black background with a yellow ball moving from the left to the right side of the screen. The video ends with a black and white screen with a yellow ball moving from the left to the right side of the screen.", "gt-answer": "B. rotates at the same speed as the earth below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the earth rotates at different speeds. It starts with the earth rotating faster than the moon, then they rotate at the same speed, and finally, the earth rotates slower than the moon.", "chatgpt-answer": "A. slower than the earth below", "video-llm-prediction": "The video shows the earth rotating at different speeds, with the moon and the earth in the background. The video starts with the earth rotating at a faster speed than the moon, and then the moon rotates at the same speed as the earth. Finally, the earth rotates at a slower speed than the moon.", "gt-answer": "B. rotates at the same speed as the earth below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the earth is rotating at a faster speed than the moon, which implies that the speed of the earth above is faster than the speed of the earth below.", "chatgpt-answer": "C. faster than the earth below", "video-llm-prediction": "The video showcases the earth rotating at a faster speed than the moon, which is also rotating. The video also features a black and white image of the earth and moon, with the earth appearing larger than the moon.", "gt-answer": "B. rotates at the same speed as the earth below", "rating": 0 } ] }, "1056433484_concat_1": { "speed": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that the planets are moving in different directions and some are moving faster than others. Since the video specifically mentions the movement of the planets and their rotation around the sun, it implies that the speed of the earth above would be different from the speed of the earth below.", "chatgpt-answer": "A. faster than the earth below", "video-llm-prediction": "The video shows a solar system with the sun at the center and the planets rotating around it. The video also shows the planets moving in different directions, with some moving faster than the others. The video emphasizes the movement of the planets and their rotation around the sun.", "gt-answer": "C. slower than the earth below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the first scene shows the earth rotating faster than the moon, the second scene shows the earth rotating at the same speed as the moon, and the third scene shows the earth rotating slower than the moon. Therefore, we can conclude that the speed of the earth above is rotating faster than the earth below.", "chatgpt-answer": "A. faster than the earth below", "video-llm-prediction": "The video showcases the movement of the earth and its rotation. The first scene displays the earth rotating faster than the moon, while the second scene shows the earth rotating at the same speed as the moon. The third scene shows the earth rotating slower than the moon. The video emphasizes the earth's movement and rotation, providing a visual representation of the earth's position in space.", "gt-answer": "C. slower than the earth below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the Earth rotates faster than the moon, indicating that the speed of the Earth above is different from the speed of the Earth below.", "chatgpt-answer": "A. faster than the earth below", "video-llm-prediction": "The video shows a solar system with the Earth and its moon. The Earth rotates faster than the moon, and the moon rotates at the same speed as the Earth.", "gt-answer": "C. slower than the earth below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the earth above is rotating faster than the earth below.", "chatgpt-answer": "A. faster than the earth below", "video-llm-prediction": "The video showcases the rotation of the earth in different speeds, with the earth above rotating faster than the earth below. The video also features a black and white background with a white ball and a black dot, and a black and white background with a white ball and a black dot.", "gt-answer": "C. slower than the earth below", "rating": 0 } ] }, "1056433484_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed of the earth above compared to the earth below. Therefore, it is not possible to determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a black and white screen with a large black dot in the middle. The dot is surrounded by a net and two smaller dots are seen moving around it. The video then shows a series of dots moving around the screen, with some of them appearing to be in motion. The dots are seen moving in different directions and at different speeds, creating a visually interesting and dynamic scene. The video seems to be showcasing the movement and motion of the dots, with the net and the black dot in the middle serving as a focal point. Overall, the video is a visually engaging", "gt-answer": "A. faster than the earth below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the Earth is rotating at a faster speed than the moon. This means that the speed of the Earth above is faster than the speed of the Earth below.", "chatgpt-answer": "A. faster than the earth below", "video-llm-prediction": "The video showcases the Earth rotating at a faster speed than the moon, which is also rotating at the same speed as the Earth. The video also features a black and white image of the Earth and the moon, as well as a black and white image of the Earth and the sun.", "gt-answer": "A. faster than the earth below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the earth is moving faster than the other planets. It also mentions that the earth is rotating at the same speed as the other planets. Therefore, the correct answer is A. faster than the earth below.", "chatgpt-answer": "A. faster than the earth below", "video-llm-prediction": "The video shows a solar system with the earth moving faster than the other planets. The earth is also shown rotating at the same speed as the other planets.", "gt-answer": "A. faster than the earth below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the video showcases the earth rotating above and below. Since it is not mentioned that the speed of rotation changes, we can infer that the speed of the earth above is the same as the speed of the earth below.", "chatgpt-answer": "B. rotates at the same speed as the earth below", "video-llm-prediction": "The video showcases the earth rotating above and below, with the sun and moon appearing in the background. The video emphasizes the earth's rotation and the sun's and moon's positions.", "gt-answer": "A. faster than the earth below", "rating": 0 } ] }, "15695290_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description states that \"The person is also seen drawing the house at the same speed as the person above.\" This indicates that the speed of the person above when drawing a picture is the same as the person below.", "chatgpt-answer": "B. at the same speed as the person below", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. The person is seen drawing the house at a faster speed than the person below. The person is also seen drawing the house at the same speed as the person above. The person is seen drawing the house at a slower speed than the person above.", "gt-answer": "B. at the same speed as the person below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a person is drawing a house on a piece of paper and then proceeds to draw a tree and flowers around the house. However, there is no mention or comparison made about the speed of the person above and the person below. Therefore, there is not enough information to answer the question.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. The person then proceeds to draw a tree and flowers around the house. The video showcases the process of drawing a house and its surroundings.", "gt-answer": "B. at the same speed as the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any comparison between the speed of the person drawing the picture and another person. Therefore, we cannot determine the speed of the person based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. The person then draws a tree and flowers around the house. The person then draws a person and a dog next to the house. The video ends with the person drawing a sun.", "gt-answer": "B. at the same speed as the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person drawing the house continues to draw the tree and flowers. This implies that the person is drawing at a slower speed than the person below who is only drawing a tree.", "chatgpt-answer": "C. slower than the person below", "video-llm-prediction": "A person is seen drawing a house on a piece of paper while another person is seen drawing a tree. The person drawing the house continues to draw the tree and flowers.", "gt-answer": "B. at the same speed as the person below", "rating": 0 } ] }, "15695290_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed of the person drawing. We only know the sequence of objects being drawn, but we cannot determine the speed based on that information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. The person then draws a tree and flowers. The person then draws a person and a dog. The person then draws a sun. The video ends with the person drawing a house again.", "gt-answer": "C. slower than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the person's drawing. It only describes their hand movements as deliberate and precise, indicating a high level of skill and experience in drawing. Therefore, we cannot determine the speed of the person above compared to the person below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a person drawing a house with a pencil on a white sheet of paper. The person starts by drawing a square and then adds a triangle on top of it. They then draw a line to connect the two shapes and add a window to the house. The video emphasizes the importance of precision and attention to detail in drawing. The person's hand movements are deliberate and precise, indicating a high level of skill and experience in drawing. The video is a great resource for anyone looking to improve their drawing skills, as it provides a detailed demonstration of the process of drawing a house. Overall, the", "gt-answer": "C. slower than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that both persons are drawing a house and a tree with a pencil. It does not provide any information about the speed of their drawing.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a person drawing a house with a pencil. The person draws the house with a pencil and then draws a tree. The video also shows a person drawing a house with a pencil and then drawing a tree.", "gt-answer": "C. slower than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed of the person drawing. Hence, there is not enough information to determine the speed of the person.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. The person then draws a tree next to the house. The person continues to draw more trees around the house. The video showcases the process of drawing a house and trees.", "gt-answer": "C. slower than the person below", "rating": 0 } ] }, "15695290_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description includes the actions performed by the person while drawing a house, a tree, and a person sitting in front of the house. However, there is no mention or comparison made about the speed of the person drawing in relation to another person. Therefore, we cannot determine the speed of the person based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. The person draws the house with a pencil and then draws a tree in front of the house. The person then draws a person sitting in front of the house. The video ends with the person drawing a tree in front of the house.", "gt-answer": "C. faster than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description doesn't provide any information about the speed of the person when drawing a picture. Therefore, there is not enough information to answer the question.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. They draw a tree and a few flowers around the house. The person then draws a person and a dog in front of the house. The video ends with the person drawing a tree and a few flowers around the house.", "gt-answer": "C. faster than the person below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person above is moving the pen faster than the person below.", "chatgpt-answer": "C. faster than the person below", "video-llm-prediction": "A person is drawing a house on a piece of paper with a blue pen. The person is moving the pen slowly, and the person above is moving the pen faster than the person below.", "gt-answer": "C. faster than the person below", "rating": 1 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed of the person drawing the picture. It only mentions the sequence of actions, such as drawing a house, tree, person, dog, cat, and then another tree. Therefore, we cannot determine the speed of the person based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A person is seen drawing a house on a piece of paper. They draw a tree in front of the house and then draw a person. The person then draws a dog and a cat. The video ends with the person drawing a tree in front of the house again.", "gt-answer": "C. faster than the person below", "rating": 0 } ] }, "1047368344_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that both women are running at the same speed. There is no mention of one woman running faster or slower than the other.", "chatgpt-answer": "A. running at the same speed as the girl below", "video-llm-prediction": "A woman is seen running on a dock while the camera captures her movements. She runs at the same speed as another woman who is also running on the dock. The woman running slower than the other woman is also seen running on the dock. The video captures the woman's movements as she runs on the dock.", "gt-answer": "A. running at the same speed as the girl below", "rating": 1 }, { "chatgpt-reasoning": "The video description does not provide any information about the girl's speed in comparison to another girl. Therefore, there is not enough information to determine the speed of the girl.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman running on a wooden bridge over a body of water. She is wearing a yellow dress and is captured from different angles. The video also includes a scene where the woman is seen running on the same bridge, but this time she is wearing a yellow dress. The video captures the beauty of the surrounding nature, with trees and mountains visible in the background. The woman's running form is impressive, and she appears to be enjoying the experience. The video is a great representation of the beauty of nature and the joy of running.", "gt-answer": "A. running at the same speed as the girl below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is running and jumping into the water. There is no mention of any comparison or reference to another person's speed, so it cannot be determined whether she is running faster or slower than anyone else. Therefore, none of the choices are correct.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A woman in a yellow dress is seen running on a dock and jumping into the water.", "gt-answer": "A. running at the same speed as the girl below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girl is running on a wooden pier and then jumps into the water and swims towards the shore. There is no mention of another girl or any comparison to another person's speed, so we cannot determine whether the girl is running at the same speed, slower, or faster than anyone else.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A girl in a yellow dress is seen running on a wooden pier. She then jumps into the water and swims towards the shore.", "gt-answer": "A. running at the same speed as the girl below", "rating": 0 } ] }, "1047368344_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the girl above is running at a slower pace than the girl below her.", "chatgpt-answer": "A. running slower than the girl below", "video-llm-prediction": "A girl in a yellow dress is seen running on a wooden bridge over a lake. She is running at a slower pace than the girl below her. The video captures the serene beauty of the lake and the surrounding mountains.", "gt-answer": "A. running slower than the girl below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is seen running on the pier. However, it doesn't specify the speed at which she is running. Therefore, we cannot determine the exact speed of the girl based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman wearing a yellow dress who is seen dancing on a wooden pier. She is captured in various poses, including jumping and spinning. The video also features a yellow bird flying over the water. The woman is seen running on the pier, and the video ends with her jumping into the water.", "gt-answer": "A. running slower than the girl below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the girl in the yellow dress is running at a slower pace than the girl below her.", "chatgpt-answer": "A. running slower than the girl below", "video-llm-prediction": "A girl in a yellow dress is seen running on a wooden bridge. She is running at a slower pace than the girl below her. The video captures her running on the bridge while the camera pans around her.", "gt-answer": "A. running slower than the girl below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the girl in the yellow dress is running faster than the other girl. This implies that she is running at a higher speed compared to the girl below.", "chatgpt-answer": "C. running faster than the girl below", "video-llm-prediction": "A girl in a yellow dress is seen running on a dock, while another girl in a yellow dress is also running on the dock. The video captures the girl in the yellow dress running faster than the other girl.", "gt-answer": "A. running slower than the girl below", "rating": 0 } ] }, "1047368344_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the girl above is running faster than the girl below.", "chatgpt-answer": "C. running faster than the girl below", "video-llm-prediction": "The video shows a girl running on a wooden bridge over a lake. She is wearing a yellow dress and is running at the same speed as the girl below. The video also shows a woman in a yellow dress running on the same bridge. The woman is running slower than the girl below. The video also shows a girl in a yellow dress running on the same bridge. The girl is running faster than the girl below.", "gt-answer": "C. running faster than the girl below", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman in the yellow dress is running at different speeds, sometimes faster and sometimes slower than the other woman. This implies that she is not running at the same speed as the girl below, so option A is incorrect. Additionally, since there is no specific mention of her consistently running slower or consistently running faster than the girl below, we cannot determine if she is running slower or faster, making options B and C also incorrect.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman in a yellow dress running on a wooden bridge over a lake. She is seen running at different speeds, sometimes faster and sometimes slower than the other woman. The video captures the beauty of the surrounding landscape, with trees and mountains visible in the background. The woman's movements are graceful and fluid, and she appears to be enjoying the experience. The video is a perfect representation of the joy and freedom that comes with running in nature.", "gt-answer": "C. running faster than the girl below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the girl in the yellow dress is running at a slower speed than the other girl.", "chatgpt-answer": "B. running slower than the girl below", "video-llm-prediction": "A girl in a yellow dress is seen running across a wooden bridge. She is running at the same speed as another girl who is also running across the bridge. The girl in the yellow dress is also seen running across the bridge at a slower speed than the other girl.", "gt-answer": "C. running faster than the girl below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the girl is running at the same speed as another girl who is also running on the pier.", "chatgpt-answer": "A. running at the same speed as the girl below", "video-llm-prediction": "A girl in a yellow dress is seen running on a wooden pier. She is running at the same speed as another girl who is also running on the pier. The video captures the girl's movements as she runs along the pier, with the water and surrounding trees in the background. The video showcases the beauty of the natural surroundings and the joy of running in the great outdoors.", "gt-answer": "C. running faster than the girl below", "rating": 0 } ] }, "1060403198_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description states that the first scene shows the tree growing slowly, while the second scene shows the tree growing faster. Therefore, the tree above is growing faster than the tree below.", "chatgpt-answer": "B. growing faster than the tree below", "video-llm-prediction": "The video shows a tree growing at different speeds in different environments. The first scene shows the tree growing slowly, while the second scene shows the tree growing faster. The third scene shows the tree growing at the same speed as the tree below. The video emphasizes the importance of patience and perseverance in achieving one's goals.", "gt-answer": "C. growing at the same speed as the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there are two trees, one with a slower growth rate and the other with a faster growth rate. The video transitions between shots of the slower-growing tree and the faster-growing tree. Therefore, the speed of the tree above is growing slower than the tree below.", "chatgpt-answer": "A. growing slower than the tree below", "video-llm-prediction": "The video showcases two different trees, one with a slower growth rate and the other with a faster growth rate. The video starts with a close-up shot of the tree with a slower growth rate, and then it transitions to a shot of the tree with a faster growth rate. The video then shows the tree with a slower growth rate again, followed by a shot of the tree with a faster growth rate. The video ends with a shot of the tree with a slower growth rate. The video emphasizes the differences in the growth rates of the two trees, with the slower-growing tree appearing to be more stable and", "gt-answer": "C. growing at the same speed as the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that one tree is growing slower than the other. It also mentions that the other tree is growing at the same speed as the tree below.", "chatgpt-answer": "C. growing at the same speed as the tree below", "video-llm-prediction": "The video shows two trees with different growth speeds. One tree is growing slower than the other, while the other is growing at the same speed. The video also shows the growth of the trees over time.", "gt-answer": "C. growing at the same speed as the tree below", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the first tree is growing slower than the second tree, which is growing at the same speed as the first tree.", "chatgpt-answer": "A. growing slower than the tree below", "video-llm-prediction": "The video showcases two trees with different growth speeds. The first tree is growing slower than the second tree, which is growing at the same speed as the first tree. The video provides a visual representation of the growth of the trees, highlighting the differences in their growth rates.", "gt-answer": "C. growing at the same speed as the tree below", "rating": 0 } ] }, "1060403198_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description states that the tree above is growing at the same speed as the tree below, slower than the tree below, and faster than the tree below. Only option A, \"growing at the same speed as the tree below,\" matches all three statements in the video description.", "chatgpt-answer": "A. growing at the same speed as the tree below", "video-llm-prediction": "The video shows a tree growing at the same speed as the tree below. The tree is shown growing at a slower pace than the tree below. The video also shows the tree growing at a faster pace than the tree below.", "gt-answer": "C. growing faster than the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video showcases the growth of a tree, focusing on its branches and leaves. It doesn't provide any specific information about the speed of the tree's growth compared to another tree. Therefore, we cannot determine the speed of the tree based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases the growth of a tree, with a focus on its branches and leaves. The video starts with a close-up shot of the tree, and then transitions to a wider shot that shows the tree in its surroundings. The camera then zooms in on the tree's branches and leaves, providing a detailed view of their structure and texture. The video ends with a shot of the tree from afar, showcasing its grandeur and beauty. Overall, the video provides a captivating and immersive experience of the tree's growth and development.", "gt-answer": "C. growing faster than the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the tree above is growing at the same speed as the tree below.", "chatgpt-answer": "A. growing at the same speed as the tree below", "video-llm-prediction": "A tree is shown growing at the same speed as another tree below it.", "gt-answer": "C. growing faster than the tree below", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, it is clear that the tree above goes through three different stages of growth speed: initially growing at the same speed as the tree below, then growing slower than the tree below, and finally growing faster than the tree below.", "chatgpt-answer": "C. growing faster than the tree below", "video-llm-prediction": "A tree is shown growing at the same speed as another tree below it. The video then shows the tree growing slower than the tree below it. Finally, the video shows the tree growing faster than the tree below it.", "gt-answer": "C. growing faster than the tree below", "rating": 1 } ] }, "1060403198_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the tree above is growing faster than one tree below, growing at the same speed as another tree below, and growing slower than another tree below. This indicates that the tree above is exhibiting all three speeds mentioned.", "chatgpt-answer": "A. growing faster than the tree below, B. growing at the same speed as the tree below, C. growing slower than the tree below", "video-llm-prediction": "The video shows a tree growing faster than another tree below it. The video also shows a tree growing at the same speed as another tree below it. The video also shows a tree growing slower than another tree below it.", "gt-answer": "C. growing slower than the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions the growth of a tree, but it doesn't provide any specific details about the speed of the tree. Therefore, we cannot determine the speed of the tree based on the given information.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases the growth of a tree, with a focus on its branches and leaves. The video starts with a close-up shot of the tree, and then transitions to a wider shot that shows the tree in its surroundings. The camera then pans out to show the tree from a distance, highlighting its size and grandeur. The video ends with a shot of the tree in the distance, emphasizing its beauty and majesty.", "gt-answer": "C. growing slower than the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the tree above is growing faster than the tree below it.", "chatgpt-answer": "A. growing faster than the tree below", "video-llm-prediction": "A tree is shown growing faster than another tree below it.", "gt-answer": "C. growing slower than the tree below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the tree in the foreground is growing at a faster pace than the tree in the background.", "chatgpt-answer": "A. growing faster than the tree below", "video-llm-prediction": "A tree is shown growing at a faster pace than another tree in the background. The video showcases the growth of the tree in the foreground, while the other tree remains stationary. The video highlights the contrast between the two trees, with the faster-growing tree appearing more vibrant and lively. The video provides a visual representation of the growth of the tree, with the viewer being able to observe the changes in the tree's appearance over time. Overall, the video is a beautiful representation of the growth of a tree and the contrast between the two trees in the background.", "gt-answer": "C. growing slower than the tree below", "rating": 0 } ] }, "1100058499_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the man starts jumping rope at a slower pace and gradually increases his speed until he is jumping at a faster pace. It is implied that the \"man above\" refers to the man who starts at a slower pace and increases his speed, while the \"man below\" is not mentioned in the video description. Therefore, we can infer that the man above is jumping rope faster than the man below.", "chatgpt-answer": "A. jumping rope faster", "video-llm-prediction": "A man is seen jumping rope in a gym. He starts off by jumping at a slower pace and gradually increases his speed until he is jumping at a faster pace. The man continues to jump rope at the faster pace while the camera captures his movements.", "gt-answer": "B. jumping rope at the same speed", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man starts jumping rope at a slower speed, then gradually increases his speed until he is jumping rope at the same speed as before. However, the video ends with the man jumping rope faster than before. So, the correct answer would be that the speed of the man above is jumping rope faster compared to the man below.", "chatgpt-answer": "A. jumping rope faster", "video-llm-prediction": "The video showcases a man jumping rope in a gym. He starts by jumping rope at a slower speed, then gradually increases his speed until he is jumping rope at the same speed as before. The video ends with the man jumping rope faster than before.", "gt-answer": "B. jumping rope at the same speed", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the man starts jumping at a slow pace and gradually increases his speed until he reaches his maximum speed. There is no mention of another man in the video, so it cannot be compared to any other person.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man jumping rope in a gym. He starts by jumping at a slow pace and gradually increases his speed. He jumps faster and faster until he reaches his maximum speed.", "gt-answer": "B. jumping rope at the same speed", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is jumping rope at different speeds, including faster and slower. It also mentions that he is shown jumping rope in a dark room. Therefore, we can infer that the speed of the man above is different from the speed of the man below.", "chatgpt-answer": "B. jumping rope at the same speed", "video-llm-prediction": "The man in the video is seen jumping rope at different speeds, including faster and slower. He is also shown jumping rope in a dark room.", "gt-answer": "B. jumping rope at the same speed", "rating": 1 } ] }, "1100058499_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the man starts jumping rope slowly, gradually increases his speed, continues jumping rope at a faster speed, and then slows down again. The video ends with him jumping rope at the same speed as he started. This indicates that the speed of the man above is the same as the speed of the man below.", "chatgpt-answer": "C. jumping rope at the same speed", "video-llm-prediction": "The video shows a man jumping rope in a gym. He starts by jumping rope slowly and gradually increases his speed. He continues jumping rope at a faster speed and then slows down again. The video ends with him jumping rope at the same speed as he started.", "gt-answer": "B. jumping rope slower", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the man starts by jumping rope at a slower pace and gradually increases his speed. It further mentions that the man then jumps rope at a faster pace, showcasing his agility. Therefore, the speed of the man in the video is faster compared to the man below.", "chatgpt-answer": "A. jumping rope faster", "video-llm-prediction": "The video showcases a man performing a jump rope routine in a gym. He starts by jumping rope at a slower pace and gradually increases his speed. The man then jumps rope at a faster pace, showcasing his agility and coordination. Throughout the video, the man maintains a consistent rhythm and form, demonstrating his skill and dedication to the sport. The gym setting provides a backdrop for the man's impressive display of athleticism, and the video captures the intensity and focus required to perform such a routine. Overall, the video is a test", "gt-answer": "B. jumping rope slower", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man starts by jumping rope slowly, then speeds up and jumps rope faster. Finally, he returns to jumping rope at the same speed as before. This means that the speed of the man above is changing, while the speed of the man below remains constant.", "chatgpt-answer": "B. jumping rope slower", "video-llm-prediction": "The man in the video is jumping rope at different speeds. He starts by jumping rope slowly, then speeds up and jumps rope faster. Finally, he returns to jumping rope at the same speed as before.", "gt-answer": "B. jumping rope slower", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man in the video is seen jumping rope at different speeds, including faster and slower. It also mentions that he is shown jumping rope in front of a mirror. Based on this information, we can conclude that the speed of the man above is different from the speed of the man below, so they are not jumping rope at the same speed.", "chatgpt-answer": "C. jumping rope at the same speed", "video-llm-prediction": "The man in the video is seen jumping rope at different speeds, including faster and slower. He is also shown jumping rope in front of a mirror.", "gt-answer": "B. jumping rope slower", "rating": 0 } ] }, "1100058499_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the man starts jumping rope slowly and gradually increases his speed. However, it also mentions that he ends the video jumping rope at the same speed as he started. Therefore, the speed of the man above is jumping rope at the same speed as the man below.", "chatgpt-answer": "C. jumping rope at the same speed", "video-llm-prediction": "The video shows a man jumping rope in a gym. He starts by jumping rope slowly and gradually increases his speed. He then jumps rope faster and faster until he reaches his maximum speed. The video ends with him jumping rope at the same speed as he started.", "gt-answer": "A. jumping rope faster", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man starts jumping rope at a slower pace and gradually increases his speed. It implies that the speed of the man above is faster than the man below, as no information is provided about another person jumping rope at the same time.", "chatgpt-answer": "A. jumping rope faster", "video-llm-prediction": "The video showcases a man performing a jump rope routine in a gym. He starts by jumping rope at a slower pace and gradually increases his speed. The man's movements are fluid and controlled, and he maintains a steady rhythm throughout the routine. The gym is well-lit, with a variety of exercise equipment visible in the background. The man's form is excellent, and he appears to be in excellent physical shape. Overall, the video is a great example of how jump rope can be used as a form of exercise and a way to improve cardiovascular fitness.", "gt-answer": "A. jumping rope faster", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man starts off slow and gradually speeds up while jumping rope. This implies that the speed of the man above is increasing. Without any mention of another man or a different scenario, we cannot compare the speed of the man above with any other individual. Therefore, it can be inferred that we do not have enough information to determine the speed of the man above in comparison to the man below.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen jumping rope in a gym. He starts off slow and gradually speeds up.", "gt-answer": "A. jumping rope faster", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is jumping rope at different speeds, including faster and slower. Therefore, we can conclude that the speed of the man above is different from the speed of the man below.", "chatgpt-answer": "C. jumping rope at the same speed", "video-llm-prediction": "The man in the video is seen jumping rope at different speeds, including faster and slower. He is also shown jumping rope in a dark room.", "gt-answer": "A. jumping rope faster", "rating": 0 } ] }, "1092813279_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description explicitly mentions that there are two women doing push-ups at the same speed. Therefore, option B is the correct answer.", "chatgpt-answer": "B. two women doing push ups at the same speed", "video-llm-prediction": "The video shows a woman performing push-ups on a red ground. She is wearing a black sports kit and is doing the exercise at a slow speed. The video also shows another woman doing push-ups at the same speed. The video is shot in a park, and there are trees and buildings in the background.", "gt-answer": "B. two women doing push ups at the same speed", "rating": 1 }, { "chatgpt-reasoning": "The video description does not provide any information about the speed at which the women are doing push-ups. It only mentions that the woman is doing push-ups on a playground and emphasizes the importance of physical activity. Therefore, we cannot determine which woman is doing push-ups slower based on the video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman performing push-ups on a playground. She starts by lying on the ground and then proceeds to do several push-ups. The video emphasizes the importance of physical activity and exercise, particularly in outdoor settings. The woman's form is excellent, and she appears to be in good physical shape. The playground provides a fun and engaging environment for exercise, and the video encourages viewers to take advantage of their surroundings to stay active. Overall, the video is a great reminder of the benefits of incorporating physical activity into our daily lives, no matter where we", "gt-answer": "B. two women doing push ups at the same speed", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is doing push ups at a slow speed.", "chatgpt-answer": "A. the woman below", "video-llm-prediction": "A woman is seen doing push ups on a playground. She is wearing a black sports bra and black shorts. The video shows her doing push ups at a slow speed.", "gt-answer": "B. two women doing push ups at the same speed", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman starts doing push-ups slowly and gradually increases her speed, while the second woman does push-ups at the same speed as the first woman. Therefore, the woman below is doing push-ups slower.", "chatgpt-answer": "A. the woman below", "video-llm-prediction": "The video showcases a woman performing push-ups on a playground. She starts by doing them slowly and gradually increases her speed. The video also features another woman doing push-ups at the same speed as the first woman. The video emphasizes the importance of proper form and technique when performing push-ups.", "gt-answer": "B. two women doing push ups at the same speed", "rating": 0 } ] }, "1092813279_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the video is in slow motion, which implies that both women are doing push-ups at the same speed.", "chatgpt-answer": "C. two women doing push ups at the same speed", "video-llm-prediction": "The video shows a woman performing push-ups on a playground. She is wearing a black sports bra and black shorts. The video is in slow motion, and the woman is shown doing push-ups in different positions. The video also shows a woman doing push-ups on a bench. The video is consistent with the information that the woman is doing push-ups on a playground.", "gt-answer": "B. the woman above", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the second woman is performing push-ups at the same speed as the first woman. Therefore, the correct answer is:", "chatgpt-answer": "C. two women doing push-ups at the same speed", "video-llm-prediction": "The video showcases a woman performing a series of push-ups on a playground. The video starts with a woman lying on the ground and then proceeds to show her performing push-ups. The video then shows a second woman performing push-ups at the same speed as the first woman. The video ends with the first woman continuing to perform push-ups. The video highlights the importance of physical fitness and the benefits of incorporating exercise into one's daily routine.", "gt-answer": "B. the woman above", "rating": 0 }, { "chatgpt-reasoning": "The video description states that there is only one woman doing push ups, so there are no two women to compare their speeds. Therefore, the answer is \"None of the choices are correct\".", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A woman is seen doing push ups on a playground. She is wearing a black sports bra and black shorts. The video shows her doing push ups on a red ground.", "gt-answer": "B. the woman above", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video includes a side-by-side comparison of the woman's movements, highlighting the different techniques she employs. It does not mention anything about the speed of their push-ups. Therefore, we cannot determine which woman is doing push-ups slower based on the provided information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman performing push-ups on a playground. She starts by doing them on her knees and then progresses to doing them on her elbows. The video also includes a side-by-side comparison of the woman's movements, highlighting the different techniques she employs. The video emphasizes the importance of proper form and technique when performing push-ups, and it serves as a helpful guide for those looking to improve their own technique.", "gt-answer": "B. the woman above", "rating": 0 } ] }, "1092813279_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description states that the woman is doing push ups at a slow speed, which means she is slower than the other two women.", "chatgpt-answer": "A. the woman above", "video-llm-prediction": "A woman is shown doing push ups on a red ground. She is wearing a black sports kit and is doing push ups at a slow speed.", "gt-answer": "C. the woman below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman starts by doing push-ups on her knees, then stands up and continues with push-ups, and ends with push-ups on her knees again. Since it is mentioned that the video showcases only one woman, it can be concluded that there is no other woman in the video. Therefore, there are no multiple women to compare their speed of performing push-ups, so the answer would be \"None of the choices are correct\".", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman performing push-ups on a red-colored gym floor. She is wearing a black sports bra and black shorts, and her hair is tied up in a ponytail. The video starts with her doing push-ups on her knees, and then she stands up and continues doing push-ups. The video ends with her doing push-ups on her knees again.", "gt-answer": "C. the woman below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there are two women doing push-ups on the red ground. It does not provide any information about the speed at which they are doing push-ups. Therefore, it is not possible to determine which woman is doing push-ups slower based on the provided information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a woman performing push-ups on a red ground. She starts by doing push-ups on her knees and then continues to do them on her elbows. The video also shows another woman doing push-ups on the same ground. The video emphasizes the importance of physical fitness and the benefits of regular exercise.", "gt-answer": "C. the woman below", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention anything about the speed at which the women are doing push-ups. Therefore, we cannot determine who is doing push ups slower based on the video description.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman performing push-ups on a playground. She starts by doing push-ups on her knees and then progresses to doing them on her elbows. The video emphasizes the importance of proper form and technique when performing push-ups.", "gt-answer": "C. the woman below", "rating": 0 } ] }, "1084518106_concat_0": { "speed": [ { "chatgpt-reasoning": "According to the video description, the truck is seen driving at the same speed as another truck that is driving below it. It is also mentioned that the truck is driving faster than the truck below it and slower than the truck below it. These statements create a paradox and cannot all be true simultaneously. Therefore, none of the choices are correct.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A truck is seen driving down a road with a field on either side. The truck is driving at the same speed as another truck that is driving below it. The truck is seen driving faster than the truck below it. The truck is also seen driving slower than the truck below it.", "gt-answer": "A. driving at the same speed as the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the truck above is seen driving at the same speed as the truck below, and it is also seen driving faster than the truck below.", "chatgpt-answer": "B. driving faster than the truck below", "video-llm-prediction": "The video showcases a truck driving down a highway, passing by a field of wheat. The truck is seen driving at the same speed as the truck below, and it is also seen driving faster than the truck below. The video captures the beauty of the wheat field and the tranquility of the highway.", "gt-answer": "A. driving at the same speed as the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the truck above is driving at the same speed as the truck below.", "chatgpt-answer": "A. driving at the same speed as the truck below", "video-llm-prediction": "A truck is driving on a road with a field on both sides. The truck is driving at the same speed as the truck below.", "gt-answer": "A. driving at the same speed as the truck below", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the truck above is driving at the same speed as the truck below.", "chatgpt-answer": "A. driving at the same speed as the truck below", "video-llm-prediction": "A truck is seen driving on a highway, passing by a field of wheat. The truck is driving at the same speed as the truck below.", "gt-answer": "A. driving at the same speed as the truck below", "rating": 1 } ] }, "1084518106_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description explicitly states that the truck above is driving at the same speed as the truck below.", "chatgpt-answer": "C. driving at the same speed as the truck below", "video-llm-prediction": "A truck is seen driving on a road with a field on either side. The truck is driving at the same speed as the truck below it.", "gt-answer": "B. driving faster than the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the truck is seen driving at different speeds, including slower than the truck below and faster than the truck below. This implies that the speed of the truck above cannot be the same as the truck below.", "chatgpt-answer": "C. driving at the same speed as the truck below", "video-llm-prediction": "The video showcases a truck driving on a highway, passing by a field of wheat. The truck is seen driving at different speeds, including slower than the truck below and faster than the truck below. The video captures the beauty of the wheat field and the tranquility of the highway.", "gt-answer": "B. driving faster than the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the truck above is driving at the same speed as the truck below.", "chatgpt-answer": "C. driving at the same speed as the truck below", "video-llm-prediction": "A truck is seen driving on a road with a field on either side. The truck is driving at the same speed as another truck below it.", "gt-answer": "B. driving faster than the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the truck is seen driving at different speeds, including slower than the truck below and faster than the truck below. Therefore, the correct answer is B. driving faster than the truck below.", "chatgpt-answer": "B. driving faster than the truck below", "video-llm-prediction": "The video showcases a truck driving on a highway, with the camera capturing the truck from different angles. The truck is seen driving at different speeds, including slower than the truck below and faster than the truck below. The video also captures the truck driving on a road with trees in the background.", "gt-answer": "B. driving faster than the truck below", "rating": 1 } ] }, "1084518106_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the truck is seen driving faster than another truck on the road. It also mentions that the truck is driving at the same speed as another truck on the road. Therefore, the correct answer is A. driving faster than the truck below.", "chatgpt-answer": "A. driving faster than the truck below", "video-llm-prediction": "The video shows a truck driving on a highway, passing by a field of wheat. The truck is seen driving faster than another truck on the road. The video also shows the truck driving at the same speed as another truck on the road.", "gt-answer": "B. driving slower than the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the truck above is shown driving at different speeds compared to the truck below. It specifically states that there are instances where the truck above is driving faster, slower, or at the same speed as the truck below.", "chatgpt-answer": "C. driving at the same speed as the truck below", "video-llm-prediction": "The video showcases a truck driving on a highway, passing by a field of wheat. The truck is seen driving at different speeds, with one instance showing it driving faster than the truck below, while another instance shows it driving slower than the truck below. The video also features a scene where the truck is driving at the same speed as the truck below. The field of wheat serves as a picturesque backdrop for the truck's journey, providing a serene and peaceful atmosphere. Overall, the video captures the beauty of the countryside and the tranquility", "gt-answer": "B. driving slower than the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the truck above is driving at the same speed as the truck below it.", "chatgpt-answer": "C. driving at the same speed as the truck below", "video-llm-prediction": "A truck is seen driving on a highway with a field on either side. The truck is driving at the same speed as the truck below it.", "gt-answer": "B. driving slower than the truck below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the truck above is seen driving at the same speed as the truck below it.", "chatgpt-answer": "C. driving at the same speed as the truck below", "video-llm-prediction": "A truck is seen driving on a highway, passing by a field of wheat. The truck is seen driving at the same speed as another truck below it.", "gt-answer": "B. driving slower than the truck below", "rating": 0 } ] }, "1062609286_concat_0": { "speed": [ { "chatgpt-reasoning": "The video description mentions that the battery charge above is increasing at a slower speed than the battery charge below.", "chatgpt-answer": "A. increasing at a slower speed than the battery charge below", "video-llm-prediction": "The video displays two different types of meters, one with a battery charge and the other with a battery charge and power. The video shows the battery charge increasing at a slower speed than the battery charge below.", "gt-answer": "C. increasing at the same speed as the battery charge below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the battery charge above is increasing at a slower speed than the battery charge below.", "chatgpt-answer": "A. increasing at a slower speed than the battery charge below", "video-llm-prediction": "The video displays two different battery charges, one above the other, with the battery charge above increasing at a slower speed than the battery charge below.", "gt-answer": "C. increasing at the same speed as the battery charge below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the battery charge above is increasing at a slower speed than the battery charge below.", "chatgpt-answer": "A. increasing at a slower speed than the battery charge below", "video-llm-prediction": "A video shows a battery charge increasing at a slower speed than the battery charge below.", "gt-answer": "C. increasing at the same speed as the battery charge below", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the battery charge starts at 100% and gradually decreases to 0%, indicating a decrease in battery charge. It also mentions that the battery charge at 50% and 75% is displayed, which means the battery charge is decreasing at a constant rate. Therefore, the battery charge above is decreasing at the same speed as the battery charge below.", "chatgpt-answer": "C. increasing at the same speed as the battery charge below", "video-llm-prediction": "The video showcases a car's battery charge, which starts at 100% and gradually decreases to 0%. The video also displays the battery charge at 50% and 75%.", "gt-answer": "C. increasing at the same speed as the battery charge below", "rating": 1 } ] }, "1062609286_concat_1": { "speed": [ { "chatgpt-reasoning": "The video description states that the first speed of charging is faster than the second speed. Additionally, it mentions that the car battery above is fully charged. Therefore, the battery charge above is increasing at a slower speed than the battery charge below.", "chatgpt-answer": "C. increasing at a slower speed than the battery charge below", "video-llm-prediction": "The video shows a car battery with two different speeds of charging. The first speed is faster than the second speed. The video also shows a car with a battery that is fully charged.", "gt-answer": "C. increasing at a slower speed than the battery charge below", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the battery charge above is increasing at a faster speed than the battery charge below.", "chatgpt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "The video displays two different types of battery charges, one with a faster speed and the other with a slower speed. The video also shows the battery charge above increasing at a faster speed than the battery charge below.", "gt-answer": "C. increasing at a slower speed than the battery charge below", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the battery charge above is increasing at a faster speed than the battery charge below.", "chatgpt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "The video shows a battery charge above and below a power meter. The battery charge above is increasing at a faster speed than the battery charge below.", "gt-answer": "C. increasing at a slower speed than the battery charge below", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there are two different speeds of battery charges displayed. It states that the first speed is increasing at a faster speed than the second speed. Therefore, we can conclude that the battery charge above is increasing at a faster speed than the battery charge below.", "chatgpt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "The video showcases a battery charge indicator with two different speeds displayed. The first speed is increasing at a faster speed than the second speed. The second speed is increasing at the same speed as the first speed. The video provides a visual representation of the battery charge indicator, highlighting the differences in the speed of the two charges.", "gt-answer": "C. increasing at a slower speed than the battery charge below", "rating": 0 } ] }, "1062609286_concat_2": { "speed": [ { "chatgpt-reasoning": "The video description clearly states that the battery charge above is increasing at a faster speed than the battery charge below. This indicates that the rate of increase for the battery charge above is higher compared to the battery charge below.", "chatgpt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "The video shows a battery charge increasing at a faster speed than the battery charge below.", "gt-answer": "A. increasing at a faster speed than the battery charge below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the battery charge above is increasing at a slower speed than the battery charge below. This indicates that the battery charge above is not increasing at a faster or same speed as the battery charge below.", "chatgpt-answer": "B. increasing at a slower speed than the battery charge below", "video-llm-prediction": "The video displays two different types of meters, one of which is a battery charge meter. The meter shows that the battery charge is increasing at a faster speed than the battery charge below. The video also shows that the battery charge is increasing at a slower speed than the battery charge above.", "gt-answer": "A. increasing at a faster speed than the battery charge below", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically states that the battery charge above is increasing at a faster speed than the battery charge below.", "chatgpt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "The video shows a car's battery charge above and below, with the battery charge above increasing at a faster speed than the battery charge below.", "gt-answer": "A. increasing at a faster speed than the battery charge below", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the battery charge above is increasing at a faster speed than the battery charge below.", "chatgpt-answer": "A. increasing at a faster speed than the battery charge below", "video-llm-prediction": "The video displays two different battery charges, one above the other, with the battery charge above increasing at a faster speed than the battery charge below. The video emphasizes the importance of battery life and the need to conserve energy.", "gt-answer": "A. increasing at a faster speed than the battery charge below", "rating": 1 } ] }, "1111601171_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the light on the building is gradually changing from blue to red and then to green.", "chatgpt-answer": "A. It is changing from blue to red.", "video-llm-prediction": "The video shows a large building with a blue light on it. The light gradually changes to red and then to green. The building is located in a city with other buildings in the background. The video captures the beauty of the building and its surroundings.", "gt-answer": "B. It is changing from blue to green.", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the sphere building is changing colors from blue to red, green, and back to blue.", "chatgpt-answer": "A. It is changing from blue to red.", "video-llm-prediction": "The video showcases a large sphere building that is changing colors from blue to red, green, and back to blue. The building is located in a city and is surrounded by other buildings. The video captures the beauty of the changing colors of the sphere building, making it a visually stunning sight.", "gt-answer": "B. It is changing from blue to green.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the sphere building is changing colors. It starts with blue, then changes to red, then green, and finally back to blue.", "chatgpt-answer": "B. It is changing from blue to green.", "video-llm-prediction": "The video shows a large sphere building in the middle of a city. The sphere is changing from blue to red, then to green, and finally back to blue.", "gt-answer": "B. It is changing from blue to green.", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the sphere building is changing colors from blue to red, green, and back to blue.", "chatgpt-answer": "A. It is changing from blue to red.", "video-llm-prediction": "The video showcases a large sphere building that is changing colors from blue to red, green, and back to blue. The building is located in a city at night, and the colors are changing in sync with the music. The video captures the beauty of the building and the city's nightlife.", "gt-answer": "B. It is changing from blue to green.", "rating": 0 } ] }, "1086105089_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the building is being constructed. Additionally, it mentions that the building is growing wider as the video progresses, which aligns with the process of construction.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "The video showcases a building being constructed, with a crane seen in the background. The building is growing wider as the video progresses.", "gt-answer": "C. demolishing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the building is being constructed and growing wider. The description mentions that the camera pans around the building to show the progress of the construction, which indicates that the building is being built.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "The video showcases a building that is being constructed, and it is growing wider. The camera pans around the building, and the viewer can see the progress of the construction. The building is made of glass and steel, and it is located in a city. The video also shows a cloudy sky, which adds to the overall aesthetic of the video.", "gt-answer": "C. demolishing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the construction of a building is being showcased. It starts with an outside view, transitions to an inside view, shows the outside again, and ends with another inside view. This implies that the building is in the process of being constructed.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "A video showcasing the construction of a building is presented. The video starts with a view of the building from the outside, and then transitions to a view of the building from the inside. The camera then shows the building from the outside, and the video ends with a view of the building from the inside.", "gt-answer": "C. demolishing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that a large building is being constructed. It also mentions that the size of the building is growing wider, indicating the progress in its construction.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "A large building is being constructed, and its size is growing wider.", "gt-answer": "C. demolishing", "rating": 0 } ] }, "1058498242_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the 3d pixels are changing from a flat surface to a cuboid and then back to a flat surface. This means that they are undergoing a transformation from one shape to another and then returning to the original shape.", "chatgpt-answer": "A. changing from a flat surface into a cuboid", "video-llm-prediction": "The video showcases a man sculpture that changes from a flat surface to a cuboid and then back to a flat surface. The video also features a white pillar that changes from a flat surface to a cuboid and then back to a flat surface.", "gt-answer": "D. changing from the shape of a man into a cuboid", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the 3D pixels are changing from a flat surface into a cuboid.", "chatgpt-answer": "A. changing from a flat surface into a cuboid", "video-llm-prediction": "The video showcases a statue of a man, which is made up of 3D pixels. The statue starts off as a flat surface and then transforms into a cuboid. The statue then changes back into the shape of a man. The video captures the intricate details of the statue and the transformation of the 3D pixels. The video is a testament to the artistry and craftsmanship of the sculptor.", "gt-answer": "D. changing from the shape of a man into a cuboid", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the 3D pixels are changing from a man sculpture into a cuboid and then back to a man sculpture.", "chatgpt-answer": "D. changing from the shape of a man into a cuboid", "video-llm-prediction": "A video showcases a man sculpture that changes into a cuboid and then back to a man sculpture.", "gt-answer": "D. changing from the shape of a man into a cuboid", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the statue made of 3D pixels changes from a flat surface into a cuboid and then back into a flat surface.", "chatgpt-answer": "A. changing from a flat surface into a cuboid", "video-llm-prediction": "A video showcases a statue of a man standing in front of a building, which is made of 3d pixels. The statue changes from a flat surface into a cuboid, and then back into a flat surface. The video also features a white pillar with a 1 on it.", "gt-answer": "D. changing from the shape of a man into a cuboid", "rating": 0 } ] }, "1082268005_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the Earth model is assembled and then disassembled, and it ends with the model splitting into two halves.", "chatgpt-answer": "C. splitting into two halves", "video-llm-prediction": "The video showcases a mesmerizing display of a 3D model of the Earth, which is made up of toy bricks. The model is assembled and then disassembled, and the video ends with the model splitting into two halves.", "gt-answer": "B. disassembling and disappearing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the model of the Earth is being constructed and deconstructed using Lego bricks. It specifically states that the camera pans around the model showcasing its intricate details, and then transitions to a scene where the model is being disassembled. The video concludes with a shot of the model being split into two halves. Hence, the correct answer is C. splitting into two halves.", "chatgpt-answer": "C. splitting into two halves", "video-llm-prediction": "The video showcases the process of constructing and deconstructing a model of the Earth using Lego bricks. The video begins with a close-up shot of the Lego model, followed by a zoomed-out shot of the model. The camera then pans around the model, showcasing its intricate details. The video then transitions to a scene where the model is being disassembled, with the camera focusing on the individual bricks as they are removed. The video concludes with a shot of the model being split into two halves, with the camera capturing the intricate details of", "gt-answer": "B. disassembling and disappearing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the planet earth made of toy bricks is disassembled and disappears. This means that the planet earth is being taken apart and ceases to exist.", "chatgpt-answer": "B. disassembling and disappearing", "video-llm-prediction": "A video showcases a planet earth made of toy bricks, which is then disassembled and disappears.", "gt-answer": "B. disassembling and disappearing", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the model of Earth is being assembled, disassembled, and split into two halves.", "chatgpt-answer": "C. splitting into two halves", "video-llm-prediction": "A video showcases the process of constructing and disassembling a model of the Earth using Lego bricks. The video begins with the model being assembled, followed by a scene where the model is disassembled and disappears. The video then transitions to a scene where the model splits into two halves. The video highlights the intricate details of the model and the precision required to assemble and disassemble it. The use of Lego bricks adds a unique and creative touch to the video, making it an engaging and visually appealing watch.", "gt-answer": "B. disassembling and disappearing", "rating": 0 } ] }, "1070711428_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the glacier is seen rising from the water and then breaking and falling into the water. It also mentions that the glacier is seen freezing and evaporating.", "chatgpt-answer": "B. breaking and falling in water", "video-llm-prediction": "The video showcases a glacier that is seen rising from the water and then breaking and falling into the water. The glacier is seen freezing and evaporating, and it is surrounded by water.", "gt-answer": "A. assembling and rising from water", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the glacier is rising from the water and falling into it, and also mentions the process of freezing and falling. This implies that the glacier is breaking and falling in water.", "chatgpt-answer": "B. breaking and falling in water", "video-llm-prediction": "A glacier is seen rising from the water and falling into it. The video captures the process of the glacier freezing and falling into the water.", "gt-answer": "A. assembling and rising from water", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the glacier is seen rising from the water, breaking and falling in the water, and freezing. This indicates that the glacier goes through a process of assembling and rising from water, breaking and falling in water, and freezing.", "chatgpt-answer": "A. assembling and rising from water", "video-llm-prediction": "A glacier is seen rising from the water, breaking and falling in the water, and freezing.", "gt-answer": "A. assembling and rising from water", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that one glacier is breaking and falling into the water, while another glacier is freezing and evaporating.", "chatgpt-answer": "B. breaking and falling in water", "video-llm-prediction": "A glacier is seen breaking and falling into the water, while another glacier is seen freezing and evaporating.", "gt-answer": "A. assembling and rising from water", "rating": 0 } ] }, "1057447372_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the stadium is illuminated with blue lights and a blue light shines on the field. This indicates that the brightness of the stadium is changing.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video showcases a large stadium with a green field and a blue sky in the background. The stadium is illuminated with blue lights, and the field is green. The video also features a blue light that shines on the field.", "gt-answer": "A. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the stadium is illuminated with blue lights, and the field is surrounded by a blue light. This indicates that the brightness of the stadium is increasing, so it is turning brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "The video showcases a large stadium with a green field and a blue sky in the background. The stadium is illuminated with blue lights, and the field is surrounded by a blue light. The video also features a blue light that illuminates the field.", "gt-answer": "A. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the field is illuminated by blue lights, indicating the stadium is well-lit. Therefore, the stadium is likely staying the same brightness.", "chatgpt-answer": "B. staying the same brightness", "video-llm-prediction": "A stadium with a large field of green grass is shown. The field is illuminated by blue lights, and the stadium is filled with people. The video ends with the stadium being shown again.", "gt-answer": "A. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the lights in the stadium are turning on and off. When the lights turn off, the stadium becomes darker. When the lights turn on, the stadium becomes brighter.", "chatgpt-answer": "C. turning brighter", "video-llm-prediction": "A stadium with a large audience is shown, and the lights begin to flash. The stadium is then shown with the lights turned off, and the audience is shown. The stadium is then shown with the lights turned on, and the audience is shown again.", "gt-answer": "A. turning darker", "rating": 0 } ] }, "1053334574_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the ink is squeezed out onto a surface and then shown spreading out and creating a pattern. This indicates that the ink is expanding from the center.", "chatgpt-answer": "D. expanding from the center", "video-llm-prediction": "The video showcases the process of creating a painting using black ink. The ink is first shown in a container and then squeezed out onto a surface to create a large splash. The ink is then shown spreading out and creating a pattern on the surface. The video also includes close-up shots of the ink spreading out and creating a pattern. The video ends with a shot of the ink spreading out and creating a pattern on the surface.", "gt-answer": "C. shrinking into the the center", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the ink is seen spreading out and creating a pattern on the canvas. This implies that the ink is expanding from its initial point.", "chatgpt-answer": "D. expanding from the center", "video-llm-prediction": "The video showcases the process of creating a painting using black ink. The artist starts by dipping a brush into the ink and then begins to paint on a canvas. The ink is seen spreading out and creating a pattern on the canvas. The artist continues to paint, and the ink spreads out and creates a larger pattern. The video ends with the artist finishing the painting.", "gt-answer": "C. shrinking into the the center", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the black ink is being used in different ways, such as being spilled on paper, creating a stain, and being used to create a painting and a drawing. These actions involve the ink moving or spreading in various directions.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video showcasing the different ways black ink can be used. The video starts with a close-up shot of black ink, which then transitions to a white background with the words \"black ink\" written on it. The video then shows several different ways black ink can be used, including being spilled on paper and creating a stain. The video also shows the ink being used to create a painting and a drawing. Throughout the video, the ink is shown in various colors and positions, including being squeezed out of a bottle and being poured onto a surface. The", "gt-answer": "C. shrinking into the the center", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the black ink is being used by a person to paint on a canvas. The video does not mention anything about the ink splitting, shrinking into the center, or expanding from the center. Therefore, the correct answer is that the black ink is staying in the same shape.", "chatgpt-answer": "A. staying in the same shape", "video-llm-prediction": "A video showcases the process of creating a painting using black ink. The video begins with a close-up shot of the ink, which then transitions to a person using a brush to paint on a canvas. The camera captures the brushstrokes as the person paints, and the video ends with a close-up shot of the finished painting.", "gt-answer": "C. shrinking into the the center", "rating": 0 } ] }, "1016172301_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the 3D house model is shown being demolished, then being constructed, and finally painted.", "chatgpt-answer": "A. being demolished, B. being constructed, C. being painted", "video-llm-prediction": "A 3D house model is shown being demolished, then being constructed, and finally painted.", "gt-answer": "A. being demolished", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the 3D house model is being constructed, painted, and then being demolished. It mentions the various stages of completion and the final stage of destruction.", "chatgpt-answer": "A. being demolished", "video-llm-prediction": "The video showcases a 3D house model being constructed, painted, and then being demolished. The model is shown in various stages of completion, with the final stage showing it being destroyed. The video provides a detailed look at the process of constructing a house, from the initial stages of building to the final stages of demolition. The viewer can see the intricate details of the model, including the roof, walls, and windows, as well as the various tools and equipment used in the construction process. Overall, the video provides a comprehensive overview of the process of constructing a house, from start to", "gt-answer": "A. being demolished", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the 3D house model is shown being demolished, then being constructed, and finally painted. Therefore, all three actions are happening to the 3D house model.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A 3D house model is shown being demolished, then being constructed, and finally painted.", "gt-answer": "A. being demolished", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the 3D house model is shown being demolished, then being constructed, and finally painted.", "chatgpt-answer": "C. being painted", "video-llm-prediction": "A 3D house model is shown being demolished, then being constructed, and finally painted.", "gt-answer": "A. being demolished", "rating": 0 } ] }, "1084736389_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the man's face is shown to be aging.", "chatgpt-answer": "A. Aging", "video-llm-prediction": "The video features a man with a beard who is shown in various close-up shots. The man is seen looking directly at the camera and appears to be in a state of distress. The video also includes several shots of the man's face, which is shown to be aging. The video ends with the man looking directly at the camera.", "gt-answer": "C. Morphing from a human into a chimpanzee", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man's face is the main focus of the video and that there is a scene where the man is morphed into a chimpanzee and then back into a human. Therefore, the correct answer is option B: Morphing from a chimpanzee into a human.", "chatgpt-answer": "B. Morphing from a chimpanzee into a human", "video-llm-prediction": "The video features a man with a beard and mustache, who is shown in various close-up shots. The man's face is the main focus of the video, and he is shown in different positions and angles. The video also includes a scene where the man is morphed into a chimpanzee and then back into a human. The video ends with the man looking directly at the camera.", "gt-answer": "C. Morphing from a human into a chimpanzee", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that there is a scene where the man is morphed into a chimpanzee and then back into a human. This implies that the face in the video is undergoing a transformation or morphing process.", "chatgpt-answer": "B. Morphing from a chimpanzee into a human", "video-llm-prediction": "The video features a man with a beard who is shown in various close-up shots. The video also includes a scene where the man is morphed into a chimpanzee and then back into a human. The video ends with the man looking directly at the camera.", "gt-answer": "C. Morphing from a human into a chimpanzee", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man's face is morphing into a chimpanzee and then back into a human. Therefore, the correct answer is B. Morphing from a chimpanzee into a human.", "chatgpt-answer": "B. Morphing from a chimpanzee into a human", "video-llm-prediction": "The video showcases a man's face morphing into a chimpanzee and then back into a human. The video starts with a close-up shot of the man's face, and then it morphs into a chimpanzee. The chimpanzee's face is then shown, and it morphs back into a human face. The video ends with the man's face shown again.", "gt-answer": "C. Morphing from a human into a chimpanzee", "rating": 0 } ] }, "1054494542_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the background changes from pink to green, and then back to pink.", "chatgpt-answer": "A. changing from pink to green", "video-llm-prediction": "The video shows a person holding up their hand and then making a fist. The background changes from pink to green, and then back to pink. The person then makes a fist again.", "gt-answer": "C. changing from blue to pink", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the background changes from pink to green and then back to pink.", "chatgpt-answer": "B. changing from green to pink", "video-llm-prediction": "The video features a person holding up their hand and making a fist. The background changes from pink to green, and then back to pink. The person then makes a fist again.", "gt-answer": "C. changing from blue to pink", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the background changes from pink to green and then back to pink.", "chatgpt-answer": "B. changing from green to pink", "video-llm-prediction": "A person is shown holding up their hand and making a fist. The background changes from pink to green and then back to pink.", "gt-answer": "C. changing from blue to pink", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the background changes from pink to green and then back to pink.", "chatgpt-answer": "A. changing from pink to green", "video-llm-prediction": "A person is shown holding up their hand and making a fist. The background changes from pink to green, and then back to pink. The person then makes a fist again.", "gt-answer": "C. changing from blue to pink", "rating": 0 } ] }, "1055194940_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the butterfly is transforming into a pupa and then transforming back into a butterfly. This indicates a process of metamorphosis where the insect goes through different stages.", "chatgpt-answer": "D. transforming from pupa into butterfly", "video-llm-prediction": "The video shows a butterfly transforming into a pupa and then transforming back into a butterfly.", "gt-answer": "A. transforming from butterfly into pupa", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the butterfly is transforming into a pupa and then transforming back into a butterfly.", "chatgpt-answer": "D. transforming from pupa into butterfly", "video-llm-prediction": "The video shows a butterfly transforming into a pupa and then transforming back into a butterfly.", "gt-answer": "A. transforming from butterfly into pupa", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the butterfly is shown in various stages of its life cycle - starting as a butterfly, then transforming into a pupa, and finally emerging as a butterfly again. This indicates that the insect is going through metamorphosis, transitioning from one form to another.", "chatgpt-answer": "A. transforming from butterfly into pupa", "video-llm-prediction": "A butterfly is seen hanging from a stick, and it is shown in various stages of its life cycle. It starts as a butterfly, then transforms into a pupa, and finally emerges as a butterfly again.", "gt-answer": "A. transforming from butterfly into pupa", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the butterfly is transforming into a pupa and then into a butterfly again. This indicates a complete life cycle of the insect, starting as a butterfly, transforming into a pupa, and then transforming back into a butterfly.", "chatgpt-answer": "D. transforming from pupa into butterfly", "video-llm-prediction": "The video shows a butterfly transforming into a pupa and then into a butterfly again.", "gt-answer": "A. transforming from butterfly into pupa", "rating": 0 } ] }, "1079384099_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the 3D pixel is transforming from a heart to a triangle, then to a white square, and finally to a flower.", "chatgpt-answer": "C. It is transforming from a white square into the shape of a flower", "video-llm-prediction": "The video showcases a 3D pixel transforming from a heart to a triangle, then to a white square, and finally to a flower. The video starts with a white screen displaying the words \"3D Pixel\" in the middle. The video then shows a 3D pixel transforming from the shape of a heart into a triangle. The next scene shows the same 3D pixel transforming from a triangle into the shape of a heart. The video then shows the same 3D pixel transforming from a white square into the shape of a flower. Finally, the video shows the same 3D pixel transform", "gt-answer": "D. It is transforming from the shape of a flower into a white square", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the 3D pixel is transforming from a heart to a triangle, and then back to a heart. None of the other choices match this description.", "chatgpt-answer": "A. It is transforming from the shape of a heart into a triangle", "video-llm-prediction": "The video showcases a 3D pixel transforming from a heart to a triangle, and then back to a heart. The video also features a 3D pixel transforming from a white square to a flower, and then back to a white square. The video is a visual representation of the transformation of a 3D pixel.", "gt-answer": "D. It is transforming from the shape of a flower into a white square", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the 3D pixel starts in the shape of a heart, then transforms into a triangle, followed by a flower, and finally, it transforms back into a white square. So, the correct answer is that it is transforming from the shape of a flower into a white square.", "chatgpt-answer": "D. It is transforming from the shape of a flower into a white square", "video-llm-prediction": "The video features a 3D pixel that transforms into various shapes, including a heart, triangle, and flower. The video starts with the pixel in the shape of a heart, and then it transforms into a triangle. The pixel then transforms into the shape of a flower, and finally, it transforms back into a white square.", "gt-answer": "D. It is transforming from the shape of a flower into a white square", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the 3D pixel is transforming from a heart to a triangle and then back to a heart.", "chatgpt-answer": "A. It is transforming from the shape of a heart into a triangle", "video-llm-prediction": "The video showcases a 3D pixel transforming from a heart to a triangle, and then back to a heart. The video also features a 3D pixel transforming from a white square to a flower and back to a white square. The video is a visual representation of the transformation of shapes and colors.", "gt-answer": "D. It is transforming from the shape of a flower into a white square", "rating": 0 } ] }, "1099811331_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the 3D heart gradually appears and disappears. It starts off small, grows in size, and then reduces back to a small size.", "chatgpt-answer": "D. Reducing in size", "video-llm-prediction": "The video features a 3D heart that gradually appears and disappears. The heart starts off small and gradually grows in size before gradually disappearing. The video showcases the heart's transformation from a small to a large size and back to a small size. The heart's gradual appearance and disappearance creates a mesmerizing visual effect that captivates the viewer's attention. The video's focus is solely on the heart's transformation, and there are no other objects or elements in the video. The heart's gradual appearance and disappearance creates a sense of anticipation and excitement, making", "gt-answer": "A. gradually disappearing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the 3D heart gradually appears and disappears, showcasing its growth and shrinkage. This indicates that the 3D heart is both growing in size and reducing in size.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a 3D heart that gradually appears and disappears, showcasing its growth and shrinkage.", "gt-answer": "A. gradually disappearing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the 3D heart is gradually appearing and then gradually disappearing. This indicates that the heart is going through a cycle of appearing and disappearing.", "chatgpt-answer": "B. gradually appearing", "video-llm-prediction": "The video shows a 3D heart gradually appearing and then gradually disappearing.", "gt-answer": "A. gradually disappearing", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the 3D heart gradually disappears, gradually appears, and gradually grows in size. This eliminates options C and D. Furthermore, it mentions that the heart is shown in various colors, including red and pink, which suggests that the heart is not reducing in size or changing colors.", "chatgpt-answer": "A. gradually disappearing", "video-llm-prediction": "The video features a 3D heart that gradually disappears, gradually appears, and gradually grows in size. The heart is shown in various colors, including red and pink. The video also includes a purple background with a heart-shaped shadow.", "gt-answer": "A. gradually disappearing", "rating": 1 } ] }, "1093340469_reverse": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the bathroom is well-lit, which indicates that there is sufficient lighting in the room. The description does not mention any changes in brightness, so it can be inferred that the room is staying the same brightness.", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a sink and mirror, and a towel rack. The bathroom is well-lit, and the sink is clean and well-maintained. The video also shows a person using the sink to wash their hands. The bathroom is clean and well-organized, with toiletries neatly arranged on the counter. The video provides a glimpse into the bathroom's design and functionality, highlighting its cleanliness and organization.", "gt-answer": "B. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the bathroom is well-lit with bright lighting. There is no mention of any changes in lighting, so it can be inferred that the room is staying the same brightness.", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a large mirror and a sink. The bathroom is well-lit, and the mirror is clean and clear. The sink is made of marble and is located under the mirror. The bathroom has a white color scheme, and the lighting is bright. The video also shows a bookshelf with several books on it. The video is shot from a fixed camera angle, and the background music is calming and relaxing. Overall, the video provides a peaceful and serene atmosphere, making it an ideal video for relaxation.", "gt-answer": "B. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the room is well-lit, and there is no information indicating any changes in brightness throughout the video.", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a sink and mirror, and a towel rack. The room is well-lit and has a white color scheme. The video starts with a close-up shot of the sink and mirror, and then pans out to show the entire bathroom. The camera then focuses on the sink and mirror again, before panning out again to show the entire bathroom. The video ends with a shot of the towel rack.", "gt-answer": "B. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the bathroom is well-lit. If the room is well-lit, it means that it is already bright. Therefore, the brightness would stay the same.", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a sink and mirror, and a towel rack. The bathroom is well-lit, and the sink is made of marble. The video also features a person washing their hands in the sink.", "gt-answer": "B. turning brighter", "rating": 0 } ] }, "1111601171": { "attribute_change": [ { "chatgpt-reasoning": "The video description describes that the sphere on top of the building is changing from green to blue and then to red.", "chatgpt-answer": "C. It is changing from blue to red.", "video-llm-prediction": "The video shows a large building with a blue sphere on top of it. The sphere is changing from green to blue and then to red. The building is located in a city with other buildings and a Ferris wheel in the background. The video captures the beauty of the building and its surroundings at night.", "gt-answer": "A. It is changing from green to blue.", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the sphere building is changing from green to blue, and then back to green again.", "chatgpt-answer": "A. It is changing from green to blue.", "video-llm-prediction": "The video showcases a large sphere building that is changing from green to blue, and then back to green again. The building is located in a city at night, and the video captures the changing colors of the building in a mesmerizing display.", "gt-answer": "A. It is changing from green to blue.", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the building is changing from green to blue and then to red.", "chatgpt-answer": "C. It is changing from blue to red.", "video-llm-prediction": "The video shows a large blue sphere building in the middle of a city. The building is changing from green to blue and then to red. The video captures the beauty of the city at night.", "gt-answer": "A. It is changing from green to blue.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the building is changing colors from green to blue and then back to green again.", "chatgpt-answer": "A. It is changing from green to blue.", "video-llm-prediction": "The video showcases a large sphere building that is changing colors from green to blue and then back to green again. The building is located in a city with a Ferris wheel in the background. The video captures the beauty of the changing colors of the building and the vibrant cityscape.", "gt-answer": "A. It is changing from green to blue.", "rating": 1 } ] }, "1086105089": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the building is \"under construction\" and the camera pans around the building capturing its \"growing wider\". This indicates that the building is currently being constructed and expanding in width.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "The video showcases a building under construction, with a crane visible in the background. The camera pans around the building, capturing its growing wider. The video also features a cloudy sky, with a blue sky visible in the background.", "gt-answer": "A. being constructed", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that a building is being constructed in the video, showing the progress of the construction. This indicates that the building is not being demolished or growing wider, but rather it is in the process of being constructed.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "A large building is being constructed in the video, and the camera pans around the building, showing the progress of the construction. The building is being constructed in a cloudy sky, and the camera captures the progress of the construction. The building is being constructed in a cloudy sky, and the camera captures the progress of the construction.", "gt-answer": "A. being constructed", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that a building is being constructed. None of the other choices, such as demolishing or growing wider, are mentioned in the video description.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "A building is being constructed in a cloudy sky.", "gt-answer": "A. being constructed", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the building is under construction and a crane is lifting a beam into place. Furthermore, the camera pans around the building to highlight its growing width. These details indicate that the building is being constructed and growing wider.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "A video showcases a building under construction, with a crane lifting a beam into place. The camera pans around the building, highlighting its growing width.", "gt-answer": "A. being constructed", "rating": 1 } ] }, "1058498242": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the sculpture is initially displayed as a flat surface, then it changes into a cuboid and finally back into the shape of a man. This implies that the transformation starts from a flat surface and ends with the shape of a man, with the intermediate stage being a cuboid.", "chatgpt-answer": "C. changing from a cuboid into the shape of a man", "video-llm-prediction": "The video showcases a white sculpture of a man that is initially displayed as a flat surface. The sculpture then changes into a cuboid and then back into the shape of a man. The video emphasizes the transformation of the sculpture from a flat surface to a three-dimensional object.", "gt-answer": "C. changing from a cuboid into the shape of a man", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sculpture initially starts as a flat surface, changes into a cuboid, and then returns to its original state. So, the 3D pixels are changing from a flat surface into a cuboid.", "chatgpt-answer": "D. changing from a flat surface into a cuboid", "video-llm-prediction": "The video showcases a white sculpture of a man that is initially displayed as a flat surface. The sculpture then changes into a cuboid, and the man's arms are raised. The video ends with the sculpture returning to its original state.", "gt-answer": "C. changing from a cuboid into the shape of a man", "rating": 0 }, { "chatgpt-reasoning": "From the video description, it is mentioned that the sculpture of a man is changing from a flat surface into a cuboid and then changing into a man again. This means that the 3D pixels are changing from a flat surface into a cuboid and then into the shape of a man.", "chatgpt-answer": "C. changing from a cuboid into the shape of a man", "video-llm-prediction": "A video showcasing a white sculpture of a man changing from a flat surface into a cuboid and then changing into a man again.", "gt-answer": "C. changing from a cuboid into the shape of a man", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sculpture made of 3D pixels changes from a flat surface to a cuboid and back again.", "chatgpt-answer": "A. changing from a cuboid into a flat surface", "video-llm-prediction": "The video showcases a white sculpture of a man in a room with a white wall. The sculpture is made of 3D pixels and changes from a flat surface to a cuboid and back again. The video also features a white statue of a man in a room with a white wall.", "gt-answer": "C. changing from a cuboid into the shape of a man", "rating": 0 } ] }, "1082268005": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the planet earth made of toy bricks is being disassembled and disappearing. Additionally, it also mentions that the same planet earth is splitting into two halves.", "chatgpt-answer": "B. disassembling and disappearing", "video-llm-prediction": "The video shows a planet earth made of toy bricks, which is then disassembled and disappears. The video also shows the same planet earth splitting into two halves.", "gt-answer": "A. assembling from toy bricks", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the process shown in the video is constructing and deconstructing a model of the Earth using Lego bricks.", "chatgpt-answer": "A. assembling from toy bricks", "video-llm-prediction": "The video showcases the process of constructing and deconstructing a model of the Earth using Lego bricks. The video begins with a close-up shot of the model, followed by a sequence of clips that demonstrate the process of constructing the model. The model is then deconstructed, and the process is shown again in reverse. The video ends with a final shot of the model.", "gt-answer": "A. assembling from toy bricks", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the planet earth made of toy bricks is being disassembled and disappearing.", "chatgpt-answer": "B. disassembling and disappearing", "video-llm-prediction": "A video showcases a planet earth made of toy bricks, which is then disassembled and disappears.", "gt-answer": "A. assembling from toy bricks", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the planet earth made of toy bricks is being disassembled and disappears.", "chatgpt-answer": "B. disassembling and disappearing", "video-llm-prediction": "The video showcases a mesmerizing display of a planet earth made of toy bricks, which is then disassembled and disappears. The video also features a unique visual of a blue and white globe, which is then split into two halves. The video captures the intricate details of the toy bricks and the smooth transitions between the different scenes.", "gt-answer": "A. assembling from toy bricks", "rating": 0 } ] }, "1070711428": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the glacier is breaking and falling into the water, creating a stunning display.", "chatgpt-answer": "A. breaking and falling in water", "video-llm-prediction": "The video showcases a glacier breaking and falling into the water, creating a stunning display of ice and water. The glacier is seen breaking apart and falling into the water, creating a dramatic scene. The video also shows the glacier freezing and rising from the water, creating a beautiful and serene landscape.", "gt-answer": "A. breaking and falling in water", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the glacier is breaking and falling into the water, as well as assembling and rising from the water. It also mentions that the glacier is freezing and evaporating.", "chatgpt-answer": "A. breaking and falling in water", "video-llm-prediction": "The video showcases a glacier that is breaking and falling into the water. The glacier is seen assembling and rising from the water, and it is also shown freezing and evaporating. The video captures the beauty and power of nature.", "gt-answer": "A. breaking and falling in water", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the glacier is seen breaking and falling into the water, then assembling and rising from the water. This suggests a cyclical process of breaking, falling, assembling, and rising.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A glacier is seen breaking and falling into the water, then assembling and rising from the water.", "gt-answer": "A. breaking and falling in water", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the glacier is breaking and falling into the water, then assembling and rising from the water. Therefore, the correct answer should indicate this sequence of events.", "chatgpt-answer": "A. breaking and falling in water", "video-llm-prediction": "A glacier is seen breaking and falling into the water, then assembling and rising from the water.", "gt-answer": "A. breaking and falling in water", "rating": 1 } ] }, "1057447372": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the lights of the stadium turn darker, brighter, and stay the same brightness.", "chatgpt-answer": "C. staying the same brightness", "video-llm-prediction": "A stadium with a green field and blue lights. The lights turn darker, brighter, and stay the same brightness.", "gt-answer": "B. turning brighter", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the stadium is illuminated with blue lights and there is a large blue light that illuminates the field. This suggests that the stadium is turning brighter.", "chatgpt-answer": "B. turning brighter", "video-llm-prediction": "The video showcases a large stadium with a green field and a blue sky in the background. The stadium is illuminated with blue lights, and the field is surrounded by a blue wall. The video also features a large blue light that illuminates the field.", "gt-answer": "B. turning brighter", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the stadium has blue lights. If the blue lights are turned on, it would make the stadium brighter.", "chatgpt-answer": "B. turning brighter", "video-llm-prediction": "A stadium with a green field and blue lights.", "gt-answer": "B. turning brighter", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the lights in the stadium turn darker, brighter, and stay the same brightness.", "chatgpt-answer": "C. staying the same brightness", "video-llm-prediction": "A stadium with a green field and blue lights is shown. The lights turn darker, brighter, and stay the same brightness.", "gt-answer": "B. turning brighter", "rating": 0 } ] }, "1053334574": { "attribute_change": [ { "chatgpt-reasoning": "The video description states that the black ink is being spread out and creating a painting. This implies that the black ink is expanding from the center to cover the canvas.", "chatgpt-answer": "D. expanding from the center", "video-llm-prediction": "A video showcases the process of creating a painting using black ink. The video starts with a close-up shot of the ink, which then transitions to a canvas where the ink is spread out. The ink is then shown spreading out and creating a painting. The video ends with a close-up shot of the finished painting. The video highlights the process of creating a painting using black ink, from the initial spreading of the ink to the final product. The video is informative and visually appealing, making it an excellent resource for anyone interested in painting.", "gt-answer": "D. expanding from the center", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the ink is first shown spreading out on a surface and then used to create a painting. This indicates that the ink is expanding from its initial position.", "chatgpt-answer": "D. expanding from the center", "video-llm-prediction": "The video showcases the process of creating a painting using black ink. The ink is first shown spreading out on a surface, then it is used to create a painting. The video also features close-up shots of the ink spreading and painting on the surface. The final result is a beautiful painting created using black ink.", "gt-answer": "D. expanding from the center", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the black ink is shown shrinking into the center, splitting in half, and expanding from the center.", "chatgpt-answer": "B. shrinking into the center, C. splitting in half, and D. expanding from the center", "video-llm-prediction": "A video showcasing the different ways black ink can be used. The video starts with a close-up shot of black ink, and then shows several clips of the ink being used in different ways. The ink is shown shrinking into the center, splitting in half, and expanding from the center. The video ends with a shot of the ink being used in a different way.", "gt-answer": "D. expanding from the center", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the black ink is shown to spread out from a close-up shot to fill the entire canvas. This suggests that the ink is expanding from the center.", "chatgpt-answer": "D. expanding from the center", "video-llm-prediction": "A video showcases the process of creating a painting using black ink. The video begins with a close-up shot of black ink, which then transitions to a canvas where the ink is spread out. The camera then pans out to reveal the entire painting, which is a portrait of a woman. The painting is then shown in various stages of completion, with the ink gradually spreading out to fill the entire canvas. The video ends with a shot of the completed portrait.", "gt-answer": "D. expanding from the center", "rating": 1 } ] }, "1016172301": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the 3D house model is being constructed, painted, and then demolished. This indicates that all three activities are happening to the model.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "The video shows a 3D house model being constructed, painted, and then demolished. The model is shown in different stages of construction, including a red roof and a white exterior. The video also includes a close-up of the model.", "gt-answer": "A. being constructed", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the 3D house model is being constructed, painted, and then demolished. It describes the various stages of completion, from building the foundation to the final demolition.", "chatgpt-answer": "C. being demolished", "video-llm-prediction": "The video showcases a 3D house model being constructed, painted, and then demolished. The model is shown in various stages of completion, with the final stage showing the house being demolished. The video provides a detailed look at the construction process, from the initial stages of building the foundation to the final stages of demolition. The viewer can see the intricate details of the house model, including the windows, doors, and other architectural features. The video is an excellent resource for anyone interested in learning about the construction process or for those who want to see the process in action.", "gt-answer": "A. being constructed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the 3D house model is being constructed, painted, and demolished.", "chatgpt-answer": "A. being constructed, B. being painted, C. being demolished", "video-llm-prediction": "A 3D house model is being constructed, painted, and demolished in a video.", "gt-answer": "A. being constructed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that a 3D house model is being constructed. Additionally, it specifies that the roof is being painted red, indicating that the process of painting is happening within the construction.", "chatgpt-answer": "A. being constructed", "video-llm-prediction": "A 3D house model is being constructed, and the roof is being painted red.", "gt-answer": "A. being constructed", "rating": 1 } ] }, "1084736389": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the man is shown morphing into a chimpanzee and into a human. This indicates that the face in the video is undergoing a transformation or morphing process.", "chatgpt-answer": "B. Morphing from a chimpanzee into a human", "video-llm-prediction": "The video features a man with a beard and a mustache, who is shown in various close-up shots. The man is seen looking directly at the camera, and in some shots, he is wearing a black shirt. The video also includes a scene where the man is seen morphing into a chimpanzee, and in another scene, he is shown morphing into a human. The video ends with the man looking directly at the camera.", "gt-answer": "B. Morphing from a chimpanzee into a human", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is shown morphing into a chimpanzee and then back into a human. This indicates that the face is undergoing a transformation, rather than just aging or becoming younger.", "chatgpt-answer": "B. Morphing from a chimpanzee into a human", "video-llm-prediction": "The video features a man with a beard who is shown in various close-up shots. The man is seen looking directly at the camera and appears to be in a state of agitation. The video also includes a scene where the man is shown morphing into a chimpanzee and then back into a human. The video seems to be exploring themes of aging and transformation.", "gt-answer": "B. Morphing from a chimpanzee into a human", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the video is focused on the man's facial expressions and his interaction with the camera. There is no indication or mention of any morphing or age-related changes happening to the face in the video. Therefore, choices B and D can be eliminated. Additionally, there is no mention of the man's face becoming younger or aging. However, it is mentioned that the man is shown looking at the camera and then looking away multiple times. This suggests a change in his gaze direction, not a physical transformation of the face. Hence, I choose:", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a man with a beard and a mustache, who is shown in various close-up shots. The video starts with the man looking directly at the camera, and then he is shown looking away. The man is then shown looking at the camera again, and the video ends with him looking away once more. The video seems to be focused on the man's facial expressions and his interaction with the camera.", "gt-answer": "B. Morphing from a chimpanzee into a human", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is shown in various close-up shots, looking directly at the camera, and ends with him looking away. There is no mention of any morphing or aging happening to the face. Therefore, choices B and D can be eliminated. Since there is no information about the person becoming younger, choice C can also be eliminated. Thus, the most reasonable answer is A - Aging.", "chatgpt-answer": "A. Aging", "video-llm-prediction": "The video features a man with a beard and a mustache, who is shown in various close-up shots. The man is seen looking directly at the camera, and the video ends with him looking away.", "gt-answer": "B. Morphing from a chimpanzee into a human", "rating": 0 } ] }, "1054494542": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the background changes from pink to green and then to blue.", "chatgpt-answer": "A. changing from pink to green", "video-llm-prediction": "The video features a woman holding up her hand and making a fist. The background changes from pink to green and then to blue. The woman continues to make a fist and hold her hand up.", "gt-answer": "B. changing from pink to blue", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the background changes from pink to green, then back to pink, and finally to blue.", "chatgpt-answer": "B. changing from pink to blue", "video-llm-prediction": "The video features a person holding up their hand and making a fist. The background changes from pink to green, and then back to pink. The person then makes a fist again and the background changes to blue. The video ends with the person making a fist one last time.", "gt-answer": "B. changing from pink to blue", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the background changes from pink to green and then back to pink. It also mentions that the background changes from pink to blue. Therefore, the correct answer is B. changing from pink to blue.", "chatgpt-answer": "B. changing from pink to blue", "video-llm-prediction": "The video shows a person holding up their hand and then making a fist. The background changes from pink to green and then back to pink. The person then makes a fist again and the background changes from pink to blue.", "gt-answer": "B. changing from pink to blue", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the background changes from pink to green, and then back to pink.", "chatgpt-answer": "A. changing from pink to green", "video-llm-prediction": "The video features a person holding up their hand and making a fist. The background changes from pink to green, and then back to pink. The person then makes a fist again.", "gt-answer": "B. changing from pink to blue", "rating": 0 } ] }, "1055194940": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the butterfly is transforming from a pupa into a butterfly. It mentions that the butterfly is hanging from a stick and then it starts to move its wings, indicating the transformation process.", "chatgpt-answer": "C. transforming from pupa into butterfly", "video-llm-prediction": "The video shows a butterfly transforming from a pupa into a butterfly. The butterfly is seen hanging from a stick and then it starts to move its wings. The video also shows the butterfly hanging from a string and a stick.", "gt-answer": "C. transforming from pupa into butterfly", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the butterfly is transforming from a pupa into a butterfly. It mentions the butterfly hanging and then transforming, indicating the process of metamorphosis.", "chatgpt-answer": "C. transforming from pupa into butterfly", "video-llm-prediction": "The video showcases a butterfly transforming from a pupa into a butterfly. The butterfly is seen hanging from a stick and then transforming into a butterfly. The video provides a glimpse into the life cycle of a butterfly, from its pupa stage to its adult stage. The butterfly's wings are vibrant and colorful, adding to the beauty of the video. The video is a great example of the transformation process of a butterfly and the importance of biodiversity.", "gt-answer": "C. transforming from pupa into butterfly", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically mentions that the butterfly is transforming into a pupa. This means that it is undergoing a process of metamorphosis and changing from a butterfly into a pupa.", "chatgpt-answer": "C. transforming from pupa into butterfly", "video-llm-prediction": "A butterfly is seen hanging from a stick, and it starts to transform into a pupa.", "gt-answer": "C. transforming from pupa into butterfly", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the butterfly is transforming from a pupa into a butterfly. It starts by hanging from a stick and then moves its wings. This indicates the transformation process.", "chatgpt-answer": "C. transforming from pupa into butterfly", "video-llm-prediction": "The video captures a butterfly transforming from a pupa into a butterfly. The butterfly is seen hanging from a stick and then it starts to move its wings. The video also shows the butterfly hanging from a string and then flying away.", "gt-answer": "C. transforming from pupa into butterfly", "rating": 1 } ] }, "1079384099": { "attribute_change": [ { "chatgpt-reasoning": "The video description clearly states that the 3D pixel is transforming from a white square into the shape of a flower. No other option matches this description.", "chatgpt-answer": "A. It is transforming from a white square into the shape of a flower", "video-llm-prediction": "The video showcases a 3D pixel transforming into various shapes, including a flower, heart, and triangle. The video begins with a white square, which then transforms into a flower. The flower then transforms into a heart, and finally, it transforms back into a white square. The video highlights the fluidity and versatility of 3D pixels, as they can be transformed into different shapes and forms. The video is a testament to the creativity and imagination that can be achieved through the use of 3D pixels.", "gt-answer": "A. It is transforming from a white square into the shape of a flower", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the 3D pixel is transforming into various shapes, including a flower and a heart. It starts with a white square and transforms into a flower, then into a heart. It also transforms into a triangle and then back into a heart. Finally, it transforms back into a white square.", "chatgpt-answer": "A. It is transforming from a white square into the shape of a flower", "video-llm-prediction": "The video showcases a 3D pixel transforming into various shapes, including a flower and a heart. The video starts with a white square, which then transforms into a flower, and then into a heart. The video then shows the same 3D pixel transforming into a triangle and then back into a heart. The video ends with the same 3D pixel transforming into a white square.", "gt-answer": "A. It is transforming from a white square into the shape of a flower", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the 3D pixel is transforming into a flower, heart, and triangle. It starts as a white square and ends as a white square, so it does not transform into a white square.", "chatgpt-answer": "A. It is transforming from a white square into the shape of a flower", "video-llm-prediction": "A video showcases a 3D pixel transforming into a flower, heart, and triangle, and then back into a white square.", "gt-answer": "A. It is transforming from a white square into the shape of a flower", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the 3D pixel is transforming into various shapes, including a heart, triangle, and flower. It is important to note that the video ends with the pixel transforming back into a white square.", "chatgpt-answer": "D. It is transforming from the shape of a flower into a white square", "video-llm-prediction": "A video showcases a 3D pixel transforming into various shapes, including a heart, triangle, and flower. The video highlights the transformation of the pixel into different shapes, with each shape being displayed on a pink background. The video ends with the pixel transforming back into a white square.", "gt-answer": "A. It is transforming from a white square into the shape of a flower", "rating": 0 } ] }, "1099811331": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the 3D heart is gradually appearing and gradually disappearing. None of the other options (reducing in size, growing in size) are mentioned in the description.", "chatgpt-answer": "C. gradually appearing", "video-llm-prediction": "The video features a 3D heart that gradually appears and gradually disappears. The heart is shown in different colors, including red and pink. The video also includes a purple background and a purple heart.", "gt-answer": "C. gradually appearing", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the 3D heart gradually appears and gradually disappears. This indicates that there is a transition happening with the heart in terms of visibility.", "chatgpt-answer": "B. gradually disappearing", "video-llm-prediction": "The video features a 3D heart that gradually appears and gradually disappears. The heart is shown in different colors, including red and pink. The video also includes a purple background and a purple heart.", "gt-answer": "C. gradually appearing", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the 3D heart gradually appears and gradually disappears. This means that the size of the heart remains constant, but it goes from being invisible to visible and then back to invisible again.", "chatgpt-answer": "C. gradually appearing", "video-llm-prediction": "A 3D heart gradually appears and gradually disappears.", "gt-answer": "C. gradually appearing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the 3D heart gradually appears and then gradually disappears. This implies that the 3D heart is undergoing a process of appearing and then disappearing.", "chatgpt-answer": "C. gradually appearing", "video-llm-prediction": "A video showcases a 3D heart that gradually appears and then gradually disappears.", "gt-answer": "C. gradually appearing", "rating": 1 } ] }, "1093340469": { "attribute_change": [ { "chatgpt-reasoning": "The video description mentions that the room is dimly lit. Therefore, we can infer that the room is turning darker.", "chatgpt-answer": "C. turning darker", "video-llm-prediction": "The video showcases a bathroom with a sink, mirror, and towel rack. The room is dimly lit, and the camera pans around the bathroom. The video ends with a shot of the bathroom door.", "gt-answer": "C. turning darker", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the bathroom is well-lit, indicating that it is already bright. There is no information suggesting that the brightness of the room changes.", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a sink, mirror, and storage. The bathroom is well-lit, and the sink is made of marble. The video also features a black and white photo of a bathroom with a sink and mirror.", "gt-answer": "C. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the room is consistently bright with no significant changes in lighting. This indicates that the brightness of the room is staying the same.", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a sink, mirror, and towel rack. The room is consistently bright, with no significant changes in lighting.", "gt-answer": "C. turning darker", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the bathroom is well-lit. Therefore, the correct answer is:", "chatgpt-answer": "A. staying the same brightness", "video-llm-prediction": "The video showcases a bathroom with a sink, mirror, and storage. The bathroom is well-lit and features a black and white color scheme. The video also includes a shot of a person taking a picture in the bathroom.", "gt-answer": "C. turning darker", "rating": 0 } ] }, "1059072773_1059718130_0": { "order": [ { "chatgpt-reasoning": "The video description states that the sun rises first, followed by the ice cream melting, and then ends with the sun rising again.", "chatgpt-answer": "A. Sun rising and then ice cream melting", "video-llm-prediction": "The video starts with a sun rising, and then it shows ice cream melting. The video ends with the sun rising again.", "gt-answer": "C. Sun rising and ice cream melting at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with the ice cream melting and then the sun rises in the background. Therefore, the correct order of events in the video is B. Ice cream melting and then sun rising.", "chatgpt-answer": "B. Ice cream melting and then sun rising", "video-llm-prediction": "The video showcases the melting of ice cream on a pink background, with the sun rising in the distance. The video starts with the ice cream melting, and the sun rises in the background, creating a serene and calming atmosphere. The video captures the beauty of nature and the simplicity of everyday moments. The melting ice cream represents the impermanence of things and the passage of time, while the sun rising symbolizes the renewal of hope and the beginning of a new day. The video is a reminder to appreciate the beauty of the world around us and to find joy in", "gt-answer": "C. Sun rising and ice cream melting at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the sun rises over the beach first, followed by a close-up of ice cream melting, and then ends with the sun rising again. This means that the order of events in the video is: Sun rising and then ice cream melting.", "chatgpt-answer": "A. Sun rising and then ice cream melting", "video-llm-prediction": "The video shows a sun rising over a beach, followed by a close-up of ice cream melting. The video ends with the sun rising again.", "gt-answer": "C. Sun rising and ice cream melting at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"The ice cream melts slowly, and the sun rises in the background.\" This indicates that the order of events is first the ice cream melting and then the sun rising.", "chatgpt-answer": "B. Ice cream melting and then sun rising", "video-llm-prediction": "The video showcases the melting of ice cream against a backdrop of a sunset. The ice cream melts slowly, and the sun rises in the background, creating a serene and calming atmosphere. The video captures the beauty of nature and the simplicity of everyday moments.", "gt-answer": "C. Sun rising and ice cream melting at the same time", "rating": 0 } ] }, "1059072773_1059718130_1": { "order": [ { "chatgpt-reasoning": "The video description provides a clear sequence of events. It starts with a close-up shot of a scoop of ice cream melting, followed by the camera panning out to show the sun rising in the background. The ice cream then melts again, and the sun rises once more. The video ends with the sun rising one last time. Therefore, the correct order of events is B. Sun rising and then ice cream melting.", "chatgpt-answer": "B. Sun rising and then ice cream melting", "video-llm-prediction": "The video starts with a close-up shot of a scoop of ice cream on a pink background. The ice cream is then shown melting, and the camera pans out to show the sun rising in the background. The video then shows the ice cream melting again, and the sun rising once more. The video ends with the sun rising one last time.", "gt-answer": "C. Ice cream melting and then sun rising", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the melting of the ice cream and the rising of the sun are happening simultaneously.", "chatgpt-answer": "A. Sun rising and ice cream melting at the same time", "video-llm-prediction": "The video showcases the melting of ice cream and the rising of the sun, both occurring simultaneously. The ice cream melts in a bowl, and the sun rises in the sky, creating a visually stunning scene. The video captures the contrast between the cold, creamy texture of the ice cream and the warm, golden hues of the sunrise. The viewer can appreciate the beauty of nature's contrasting elements in this video.", "gt-answer": "C. Ice cream melting and then sun rising", "rating": 0 }, { "chatgpt-reasoning": "The video description indicates that the sequence of events starts with a close-up of ice cream melting, followed by a sun rising, and ends with a sun setting.", "chatgpt-answer": "C. Ice cream melting and then sun rising", "video-llm-prediction": "The video shows a close-up of ice cream melting on a pink surface, followed by a sun rising. The video ends with the sun setting.", "gt-answer": "C. Ice cream melting and then sun rising", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the sun is rising first, followed by the ice cream melting. There is no mention of the ice cream melting before the sun rises.", "chatgpt-answer": "B. Sun rising and then ice cream melting", "video-llm-prediction": "The video captures the mesmerizing sight of a sunrise, with the sun peeking over the horizon and casting a warm glow over the landscape. As the sun rises, the camera pans to a close-up shot of a scoop of ice cream, which begins to melt and drip down the side of the scoop. The contrast between the warmth of the sunrise and the coldness of the ice cream creates a visually striking scene. The video then transitions to a shot of the sun setting, with the sun dipping below the horizon and casting a cool blue", "gt-answer": "C. Ice cream melting and then sun rising", "rating": 0 } ] }, "1059072773_1059718130_2": { "order": [ { "chatgpt-reasoning": "The video description states that the video starts with a beautiful sunrise, then it shows the ice cream melting, and finally ends with the sun rising again. This indicates that the correct order of events in the video is B) Sun rising and then ice cream melting.", "chatgpt-answer": "B. Sun rising and then ice cream melting", "video-llm-prediction": "The video starts with a beautiful sunrise, and then it shows a scoop of ice cream melting on a pink surface. The ice cream is dripping down, and the camera captures the melted ice cream as it drips down. The video then shows the ice cream melting completely, and the camera captures the entire process. The video ends with the sun rising again. Overall, the video showcases the process of ice cream melting and the beauty of the sunrise.", "gt-answer": "B. Sun rising and then ice cream melting", "rating": 1 }, { "chatgpt-reasoning": "From the video description, it is mentioned that the ice cream is seen melting on a pink surface and the sun is seen rising in the background. It also mentions that the video captures the contrast between the coldness of the ice cream and the warmth of the sun. Based on this information, we can conclude that the order of events in the video is: Ice cream melting and then sun rising.", "chatgpt-answer": "C. Ice cream melting and then sun rising", "video-llm-prediction": "The video showcases the process of ice cream melting and the sun rising. The ice cream is seen melting on a pink surface, and the sun is seen rising in the background. The video captures the contrast between the coldness of the ice cream and the warmth of the sun. The melting ice cream creates a pool of liquid, which gradually spreads across the surface. The video also highlights the beauty of nature, as the sun rises and casts its warm glow over the landscape. Overall, the video is a visual treat that captures the beauty of nature and the", "gt-answer": "B. Sun rising and then ice cream melting", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the sun rises first and then the ice cream melts. Therefore, the correct answer is B. Sun rising and then ice cream melting.", "chatgpt-answer": "B. Sun rising and then ice cream melting", "video-llm-prediction": "The video shows a sun rising and then ice cream melting. The ice cream is seen melting on a pink surface, and the video ends with the sun rising.", "gt-answer": "B. Sun rising and then ice cream melting", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the sun rises gradually and the ice cream melts slowly. It implies that the sun rising happens before the ice cream melting.", "chatgpt-answer": "B. Sun rising and then ice cream melting", "video-llm-prediction": "The video showcases the process of ice cream melting and the sun rising simultaneously. The ice cream melts slowly, and the sun rises gradually, creating a serene and calming atmosphere. The video captures the beauty of nature and the simplicity of everyday moments.", "gt-answer": "B. Sun rising and then ice cream melting", "rating": 1 } ] }, "1024867412_1034049020_0": { "order": [ { "chatgpt-reasoning": "The video description clearly states that both the girl and the dog are simultaneously engaged in their respective actions. This implies that they are performing the actions at the same time.", "chatgpt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A girl is walking on the street while a dog is simultaneously driving.", "gt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "rating": 1 }, { "chatgpt-reasoning": "The description mentions that the girl is walking on the street while a dog is simultaneously driving. This indicates that both actions are happening at the same time, so option A is the correct answer.", "chatgpt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A girl is walking on the street while a dog is simultaneously driving. The dog is seen in a car, and the girl is walking on the sidewalk. The dog is wearing sunglasses and a hat, and the girl is wearing a denim jacket and sunglasses. The dog is also holding a cell phone in its mouth.", "gt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that both events are happening simultaneously, meaning they are occurring at the same time. Therefore, the correct answer is A.", "chatgpt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A girl is walking on the street while a dog is simultaneously driving.", "gt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the girl is walking on the street *while* the dog is simultaneously driving. This implies that both actions are happening at the same time.", "chatgpt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A girl is walking on the street while a dog is simultaneously driving.", "gt-answer": "A. A girl is walking on the street while a dog is simultaneously driving", "rating": 1 } ] }, "1024867412_1034049020_1": { "order": [ { "chatgpt-reasoning": "The video description mentions that the dog is seen driving a car while a girl is walking on the street. This indicates that the events of the dog driving and the girl walking are happening at the same time.", "chatgpt-answer": "C. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is seen driving a car while a girl is walking on the street. The dog is wearing sunglasses and a tie, and the girl is carrying a blue umbrella. The video showcases the dog's ability to drive the car while the girl walks on the street.", "gt-answer": "A. A dog is driving, then a girl is walking on the street", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dog is driving a car while the girl is walking on the street. This indicates that both events are happening simultaneously.", "chatgpt-answer": "C. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is seen driving a car while a girl is walking on the street. The video captures the dog's movements as it drives, while the girl continues to walk. The video showcases the dog's ability to drive a car while the girl goes about her day. The video is a unique and interesting display of the dog's skills and the girl's casual stroll.", "gt-answer": "A. A dog is driving, then a girl is walking on the street", "rating": 0 }, { "chatgpt-reasoning": "The video description states that a dog is driving a car while a girl is walking on the street. This implies that both actions are happening simultaneously, so neither the dog driving nor the girl walking occurs before the other.", "chatgpt-answer": "C. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is driving a car while a girl is walking on the street.", "gt-answer": "A. A dog is driving, then a girl is walking on the street", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the dog is driving the car while the girl continues her walk. This implies that both events are happening simultaneously.", "chatgpt-answer": "C. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is seen driving a car while a girl walks on the street. The video showcases the dog's ability to drive the car while the girl continues her walk. The video captures the unique and amusing scene of a dog driving a car while a girl walks on the street.", "gt-answer": "A. A dog is driving, then a girl is walking on the street", "rating": 0 } ] }, "1024867412_1034049020_2": { "order": [ { "chatgpt-reasoning": "The video description states that the dog is seen driving in different locations, including a street and a parking lot, while the video also shows a girl walking on the street while the dog is driving. This indicates that the events occur simultaneously, with the dog driving and the girl walking happening at the same time.", "chatgpt-answer": "B. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is seen driving a car while wearing sunglasses. The dog is also seen smiling at the camera. The video shows the dog driving in different locations, including a street and a parking lot. The dog is seen wearing sunglasses in each scene. The video also shows a girl walking on the street while the dog is driving.", "gt-answer": "A. A girl is walking on the street, then a dog is driving", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, it states that \"A dog is seen driving a car while a girl walks on the street.\" This implies that the dog is driving first, followed by the girl walking on the street.", "chatgpt-answer": "C. A dog is driving, then a girl is walking on the street", "video-llm-prediction": "A dog is seen driving a car while a girl walks on the street. The dog is wearing sunglasses and is seen smiling at the camera. The video captures the dog's playful and adventurous nature as it takes on the role of a human driver. The girl's presence on the street adds an element of contrast to the scene, highlighting the dog's unique ability to drive a car. The video is a lighthearted and entertaining take on the idea of a dog driving a car, and it is sure to bring a smile to anyone's face who watches it", "gt-answer": "A. A girl is walking on the street, then a dog is driving", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dog is driving the car while the girl is walking on the street.", "chatgpt-answer": "B. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is seen driving a car while a girl is walking on the street. The dog is wearing sunglasses and a tongue out. The video shows the dog driving the car and the girl walking on the street.", "gt-answer": "A. A girl is walking on the street, then a dog is driving", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dog is seen driving a car while a girl is walking on the street, highlighting the dog's unique ability to drive. This implies that the events are happening simultaneously.", "chatgpt-answer": "B. A girl is walking on the street while a dog is simultaneously driving", "video-llm-prediction": "A dog is seen driving a car while a girl is walking on the street. The dog is wearing sunglasses and a denim jacket. The video captures the dog's playful and adventurous nature as it takes the wheel and drives the car. The girl's presence on the street adds an element of contrast to the scene, highlighting the dog's unique ability to drive. The video showcases the dog's confidence and ability to navigate the streets, making it a fun and entertaining watch.", "gt-answer": "A. A girl is walking on the street, then a dog is driving", "rating": 0 } ] }, "1096238125_1098970151_0": { "order": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that \"Two people are lifting weights and then a cat is licking its paw.\" This clearly indicates the order of events.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "B. The events are happening simultaneously, there is no specific order", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"Two people are lifting weights and then a cat is licking its paw,\" indicating a sequential order of events.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "B. The events are happening simultaneously, there is no specific order", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"Two people are lifting weights and then a cat is licking its paw\". This indicates a specific order of events, where the two people lifting weights come before the cat licking its paw.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "B. The events are happening simultaneously, there is no specific order", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"Two people are lifting weights and then a cat is licking its paw,\" indicating a specific order of events.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "B. The events are happening simultaneously, there is no specific order", "rating": 0 } ] }, "1096238125_1098970151_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the cat is licking its paw while the people are lifting weights. It also mentions that the cat's behavior is consistent throughout the video, while the people's exercise routine is not. Therefore, we can conclude that the cat's behavior of licking its paw happens before or at the same time as the people lifting weights.", "chatgpt-answer": "C. The events are happening simultaneously, there is no specific order.", "video-llm-prediction": "The video shows a cat licking its paw while two people are lifting weights in the background. The cat continues to lick its paw while the people continue to lift weights. The video captures the cat's behavior of licking its paw while the people are exercising. The cat's behavior is consistent with the video, while the people's exercise routine is not.", "gt-answer": "B. Two people are lifting weights and then a cat is licking its paw", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the cat continues to lick its paw while the people continue to lift weights, implying that the events are happening simultaneously.", "chatgpt-answer": "C. The events are happening simultaneously, there is no specific order", "video-llm-prediction": "The video shows a cat licking its paw while two people are lifting weights in the background. The cat continues to lick its paw while the people continue to lift weights.", "gt-answer": "B. Two people are lifting weights and then a cat is licking its paw", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the cat is seen licking its paw while two people are lifting weights in the background. It further mentions that the cat continues to lick its paw while the people continue to lift weights. This indicates that the cat starts licking its paw before the people start lifting weights, and both actions happen simultaneously.", "chatgpt-answer": "C. The events are happening simultaneously, there is no specific order", "video-llm-prediction": "A cat is seen licking its paw while two people are lifting weights in the background. The cat continues to lick its paw while the people continue to lift weights.", "gt-answer": "B. Two people are lifting weights and then a cat is licking its paw", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the cat is seen licking its paw while two people are lifting weights in the background, and it further mentions that the cat continues to lick its paw while the people continue to lift weights. This indicates that the cat's action (licking its paw) is happening concurrently with the people's action (lifting weights), so the events are happening simultaneously without a specific order.", "chatgpt-answer": "C. The events are happening simultaneously, there is no specific order", "video-llm-prediction": "A cat is seen licking its paw while two people are lifting weights in the background. The cat continues to lick its paw while the people continue to lift weights.", "gt-answer": "B. Two people are lifting weights and then a cat is licking its paw", "rating": 0 } ] }, "1096238125_1098970151_2": { "order": [ { "chatgpt-reasoning": "Based on the video description, it is mentioned that \"The video shows a man and a woman lifting weights in a gym\" and then it states \"The video also shows a cat licking its paw\". This indicates that the event of two people lifting weights happens before the event of the cat licking its paw.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "The video shows a man and a woman lifting weights in a gym. The woman is wearing a blue shirt and white tights, while the man is wearing a grey shirt and black shorts. The woman is wearing a ponytail, and the man is wearing a beard. The woman is also wearing a watch on her left hand. The video also shows a cat licking its paw, and the woman is seen doing a yoga pose on the floor.", "gt-answer": "B. A cat is licking its paw and then two people are lifting weights", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the cat's actions (licking its paw) are shown before the people start lifting weights. Therefore, option B is the correct answer.", "chatgpt-answer": "B. A cat is licking its paw and then two people are lifting weights", "video-llm-prediction": "The video shows two people lifting weights while a cat is licking its paw. The cat's actions are shown before the people start lifting weights.", "gt-answer": "B. A cat is licking its paw and then two people are lifting weights", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that \"Two people are lifting weights and then a cat is licking its paw.\" This indicates that the first event is the two people lifting weights, followed by the cat licking its paw.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "B. A cat is licking its paw and then two people are lifting weights", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"Two people are lifting weights and then a cat is licking its paw\", indicating a sequential order of events.", "chatgpt-answer": "A. Two people are lifting weights and then a cat is licking its paw", "video-llm-prediction": "Two people are lifting weights and then a cat is licking its paw.", "gt-answer": "B. A cat is licking its paw and then two people are lifting weights", "rating": 0 } ] }, "1069717165_1041584314_0": { "order": [ { "chatgpt-reasoning": "The video description states that the woman is showing different expressions first, followed by the man showing different expressions. It also mentions that the woman and the man are looking at each other, indicating a sequence of events.", "chatgpt-answer": "A. First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "The video features a woman and a man showing different expressions. The woman is seen smiling and laughing while the man is seen smiling and laughing. The video also shows the woman and the man looking at each other.", "gt-answer": "C. Both the woman and the man are showing different expressions at the same time.", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is showing different expressions first, followed by the man showing different expressions. It suggests a sequence of events.", "chatgpt-answer": "A. First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "The video features a woman and a man who are both showing different expressions. The woman is seen smiling and laughing, while the man is seen smiling and looking at the camera. The video seems to be a lighthearted and playful moment between the two individuals.", "gt-answer": "C. Both the woman and the man are showing different expressions at the same time.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman and the man are shown smiling at the camera, followed by the woman showing different expressions, and then the man showing different expressions. This sequence of events suggests that the woman shows different expressions first, followed by the man.", "chatgpt-answer": "A. First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "A woman and a man are shown smiling at the camera. The woman then shows different expressions, followed by the man.", "gt-answer": "C. Both the woman and the man are showing different expressions at the same time.", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is shown first, with expressions of smiling and laughing, followed by the man who has expressions of smiling and frowning. This indicates a sequence of events where the woman shows her expressions first and then the man.", "chatgpt-answer": "A. First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "The video features a woman and a man showing different expressions. The woman is seen smiling and laughing, while the man is seen smiling and frowning. The video appears to be a montage of different expressions, with the woman and man showcasing a range of emotions. The video is likely intended to capture the viewer's attention and evoke a range of emotions.", "gt-answer": "C. Both the woman and the man are showing different expressions at the same time.", "rating": 0 } ] }, "1069717165_1041584314_1": { "order": [ { "chatgpt-reasoning": "The video description states that both the man and the woman are smiling, laughing, and making funny faces. It does not mention any specific order of events or indicate that one person is showing expressions first before the other.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a man and a woman showing different expressions. The man is seen smiling and laughing while the woman is seen smiling and laughing. The video also shows the man and woman making funny faces.", "gt-answer": "B. First, a woman is showing different expressions; then, a man is showing different expressions.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is showing different expressions first (\"The man is seen smiling and laughing\") and then the woman is showing different expressions (\"the woman is seen smiling and laughing\"). It does not mention anything about them showing expressions at the same time, so we can rule out option C.", "chatgpt-answer": "A. First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "The video features a man and a woman showing different expressions. The man is seen smiling and laughing while the woman is seen smiling and laughing. The video also shows a man with a beard and a woman with blonde hair.", "gt-answer": "B. First, a woman is showing different expressions; then, a man is showing different expressions.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that both the man and the woman are showing different expressions. It also mentions that the man is seen smiling and laughing while the woman is seen smiling and laughing. Lastly, it says that the man and woman are looking at the camera. Based on this information, it can be inferred that both the man and the woman are showing their expressions simultaneously.", "chatgpt-answer": "C. Both the woman and the man are showing different expressions at the same time.", "video-llm-prediction": "The video shows a man and a woman showing different expressions. The man is seen smiling and laughing while the woman is seen smiling and laughing. The video also shows the man and woman looking at the camera.", "gt-answer": "B. First, a woman is showing different expressions; then, a man is showing different expressions.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen smiling and laughing first, while the woman is seen with a serious expression. Then it mentions that the man and woman are making funny faces. Therefore, the correct order of events in the video is that the man is showing different expressions first, followed by the woman.", "chatgpt-answer": "A. First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "The video features a man and a woman showing different expressions. The man is seen smiling and laughing, while the woman is seen with a serious expression. The video also shows the man and woman making funny faces.", "gt-answer": "B. First, a woman is showing different expressions; then, a man is showing different expressions.", "rating": 0 } ] }, "1069717165_1041584314_2": { "order": [ { "chatgpt-reasoning": "The video description states that the video starts with a woman showing different expressions, followed by a man doing the same. Then, both the woman and the man are shown showing different expressions at the same time. Therefore, the correct answer is A. First, a woman is showing different expressions; then, a man is showing different expressions.", "chatgpt-answer": "A. First, a woman is showing different expressions; then, a man is showing different expressions.", "video-llm-prediction": "The video starts with a woman showing different expressions, followed by a man doing the same. The video then shows both the woman and the man showing different expressions at the same time. The video seems to be a collection of different facial expressions, with no clear context or purpose. The woman and the man are the only individuals shown in the video, and there is no indication of any background or setting. Overall, the video appears to be a simple collection of facial expressions, with no clear narrative or purpose.", "gt-answer": "C. First, a man is showing different expressions; then, a woman is showing different expressions.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen smiling and laughing, while the woman is seen smiling and laughing. It also mentions that the woman is looking at the camera and smiling. Based on this information, it can be inferred that first, the man is showing different expressions, and then, the woman is showing different expressions.", "chatgpt-answer": "C. First, a man is showing different expressions; then, a woman is showing different expressions.", "video-llm-prediction": "The video features a man and a woman who are both showing different expressions. The man is seen smiling and laughing, while the woman is seen smiling and laughing. The video also shows the woman looking at the camera and smiling.", "gt-answer": "C. First, a man is showing different expressions; then, a woman is showing different expressions.", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen smiling and laughing while the woman is also seen smiling and laughing. It also mentions that the man and woman are sitting in front of a camera, but it does not mention any specific order of events.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a man and a woman showing different expressions. The man is seen smiling and laughing while the woman is seen smiling and laughing. The video also shows the man and woman sitting in front of a camera.", "gt-answer": "C. First, a man is showing different expressions; then, a woman is showing different expressions.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"The man is seen smiling and making different facial expressions, while the woman is also seen smiling and making different facial expressions.\" This indicates that both the man and the woman are showing different expressions at the same time.", "chatgpt-answer": "B. Both the woman and the man are showing different expressions at the same time.", "video-llm-prediction": "The video showcases a man and a woman displaying various facial expressions. The man is seen smiling and making different facial expressions, while the woman is also seen smiling and making different facial expressions. The video captures the emotions and expressions of the two individuals, providing a glimpse into their personalities.", "gt-answer": "C. First, a man is showing different expressions; then, a woman is showing different expressions.", "rating": 0 } ] }, "1055413730_1055973887_0": { "order": [ { "chatgpt-reasoning": "The video description mentions that both the fire ball is expanding and the earth is spinning simultaneously.", "chatgpt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "The video shows a fire ball expanding and the earth spinning simultaneously.", "gt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is expanding and the earth is spinning simultaneously. This means that both events are happening at the same time.", "chatgpt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "The video shows a fire ball expanding and the earth spinning simultaneously.", "gt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that \"the fire ball is expanding and the earth is spinning simultaneously\". Therefore, the correct answer is C. Simultaneously, the earth is spinning and the fire ball is expanding.", "chatgpt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "A video shows a fire ball expanding and the earth spinning simultaneously.", "gt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "rating": 1 }, { "chatgpt-reasoning": "The video description states that both the fire ball is expanding and the earth is spinning. However, it does not provide any specific order of events. Therefore, it can be inferred that these two events are happening simultaneously.", "chatgpt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "A fire ball is shown expanding while the earth is spinning.", "gt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "rating": 1 } ] }, "1055413730_1055973887_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the fire ball is expanding from a small to a large size while the earth is spinning in the background. This indicates that the fire ball's expansion happens first, followed by the earth's spinning.", "chatgpt-answer": "A. The fire ball is expanding, then the earth is spinning", "video-llm-prediction": "The video shows a fire ball expanding and the earth spinning simultaneously. The fire ball is seen expanding from a small to a large size, while the earth is spinning in the background. The video captures the fire ball's expansion from a small to a large size, and the earth's spinning in the background. The video showcases the fire ball's expansion from a small to a large size, while the earth is spinning in the background. The video captures the fire ball's expansion from a small to a large size, and the earth's spinning in the background. The video", "gt-answer": "B. The earth is spinning, then the fire ball is expanding", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is shown expanding in the beginning, and then the earth is shown spinning. Therefore, the correct order of events in the video is:", "chatgpt-answer": "A. The fire ball is expanding, then the earth is spinning", "video-llm-prediction": "The video depicts a fire ball expanding and the earth spinning simultaneously. The fire ball is shown expanding in the beginning, and then the earth is shown spinning. The video captures the fire ball's expansion and the earth's spinning in a visually appealing manner. The video's visuals are captivating, and the sound of the fire ball's expansion and the earth's spinning adds to the overall experience. The video's message is clear, and it is evident that the video is meant to be watched in a dark room. The video's visuals are", "gt-answer": "B. The earth is spinning, then the fire ball is expanding", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the fire ball is expanding and the earth is spinning simultaneously.", "chatgpt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "The video shows a fire ball expanding and the earth spinning simultaneously.", "gt-answer": "B. The earth is spinning, then the fire ball is expanding", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is expanding from a small to a large size and the earth is spinning in the background simultaneously. This indicates that both events, the expansion of the fire ball and the spinning of the earth, are happening at the same time.", "chatgpt-answer": "C. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "The video shows a fire ball expanding and the earth spinning simultaneously. The fire ball is seen expanding from a small to a large size, while the earth is spinning in the background. The video captures the fire ball's growth from a small to a large size, and the earth's spinning is also visible in the background. The video provides a mesmerizing view of the fire ball's expansion and the earth's spinning.", "gt-answer": "B. The earth is spinning, then the fire ball is expanding", "rating": 0 } ] }, "1055413730_1055973887_2": { "order": [ { "chatgpt-reasoning": "From the video description, it is mentioned that the video starts with a large fire ball exploding in the dark. Then, the earth spinning is shown. Finally, the video ends with the earth spinning. Therefore, the correct order of events in the video is B. The fire ball is expanding, then the earth is spinning.", "chatgpt-answer": "B. The fire ball is expanding, then the earth is spinning", "video-llm-prediction": "The video starts with a large fire ball exploding in the dark, and then the earth is shown spinning. The fire ball is expanding, and the earth is spinning. The video ends with the earth spinning.", "gt-answer": "B. The fire ball is expanding, then the earth is spinning", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the fire ball is seen expanding first and then the earth is shown spinning. Therefore, the correct order of events in the video is: The fire ball is expanding, then the earth is spinning.", "chatgpt-answer": "B. The fire ball is expanding, then the earth is spinning", "video-llm-prediction": "The video showcases a fire ball expanding and the earth spinning simultaneously. The fire ball is seen expanding and then the earth is shown spinning. The video captures the beauty of the earth and the fire ball's expansion.", "gt-answer": "B. The fire ball is expanding, then the earth is spinning", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically states that the fire ball is expanding and the earth is spinning simultaneously.", "chatgpt-answer": "A. Simultaneously, the earth is spinning and the fire ball is expanding", "video-llm-prediction": "The video shows a fire ball expanding and the earth spinning simultaneously.", "gt-answer": "B. The fire ball is expanding, then the earth is spinning", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the fire ball is expanding first, and then the earth is spinning.", "chatgpt-answer": "B. The fire ball is expanding, then the earth is spinning", "video-llm-prediction": "The video shows a fire ball expanding and then the earth spinning.", "gt-answer": "B. The fire ball is expanding, then the earth is spinning", "rating": 1 } ] }, "1058907236_1021488277_0": { "order": [ { "chatgpt-reasoning": "The video description mentions that \"A person is seen picking up a pineapple and then a squirrel is foraging in the same area.\" This indicates that the person picking up a pineapple happens before the squirrel starts foraging.", "chatgpt-answer": "A. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "A person is seen picking up a pineapple and then a squirrel is foraging in the same area. The video showcases the interaction between the person and the squirrel in the same location.", "gt-answer": "C. Both events are happening concurrently", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is seen picking up a pineapple and then the squirrel is seen foraging in the background. This indicates that the events are happening sequentially, with the person picking up the pineapple first and then the squirrel foraging.", "chatgpt-answer": "A. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "The video showcases a person picking up a pineapple and a squirrel foraging in the same scene. The person is seen holding the pineapple in their hand, while the squirrel is seen foraging in the background. The video captures the natural beauty of the forest and the interaction between humans and wildlife. The sound of the squirrel's movements and the rustling of leaves in the background adds to the immersive experience. The video highlights the importance of preserving natural habitats and the need to coexist with wildlife.", "gt-answer": "C. Both events are happening concurrently", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person is seen picking up a pineapple and then a squirrel is foraging, indicating a sequential order of events.", "chatgpt-answer": "A. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "A person is seen picking up a pineapple and then a squirrel is foraging.", "gt-answer": "C. Both events are happening concurrently", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"A person is seen picking up a pineapple and then a squirrel is foraging.\" This indicates the order of events in the video.", "chatgpt-answer": "A. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "A person is seen picking up a pineapple and then a squirrel is foraging. The video showcases the interaction between humans and wildlife in a natural setting.", "gt-answer": "C. Both events are happening concurrently", "rating": 0 } ] }, "1058907236_1021488277_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the squirrel is seen foraging in the woods and then the person picks up a pineapple. Therefore, the correct order of events is B. A squirrel is foraging and then a person is picking up a pineapple.", "chatgpt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "The video shows a squirrel foraging in the woods and a person picking up a pineapple. The squirrel is seen eating a nut and then running away. The person is shown picking up the pineapple and then cutting it open. The video ends with the person eating the pineapple.", "gt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the squirrel is seen eating a nut while the person is picking up a pineapple from the ground. Therefore, the order of events in the video is that the squirrel is foraging and then a person is picking up a pineapple.", "chatgpt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "The video showcases a squirrel foraging in a forest and a person picking up a pineapple from the ground. The squirrel is seen eating a nut, while the person is seen picking up a pineapple from the ground. The video also features a close-up shot of a pineapple, with a person's hand holding it. The video captures the beauty of nature and the simplicity of everyday life.", "gt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the person is picking up a pineapple first and then a squirrel is foraging.", "chatgpt-answer": "C. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "A person is seen picking up a pineapple and then a squirrel is foraging.", "gt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"a person is seen picking up a pineapple and then a squirrel is foraging\". This indicates that the events are happening sequentially, with the person picking up the pineapple first and then the squirrel foraging.", "chatgpt-answer": "C. A person is picking up a pineapple and then a squirrel is foraging", "video-llm-prediction": "A person is seen picking up a pineapple and then a squirrel is foraging. The video showcases the natural behavior of animals in their environment.", "gt-answer": "B. A squirrel is foraging and then a person is picking up a pineapple", "rating": 0 } ] }, "1058907236_1021488277_2": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the squirrel is foraging first, followed by a person picking up a pineapple. The events are happening sequentially, not concurrently.", "chatgpt-answer": "C. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "A squirrel is foraging and then a person is picking up a pineapple.", "gt-answer": "B. A person is picking up a pineapple and then a squirrel is foraging", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the squirrel is seen foraging in a forest first, and then a person is shown picking up a pineapple. This indicates that the order of events in the video is \"A squirrel is foraging and then a person is picking up a pineapple.\"", "chatgpt-answer": "C. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "A squirrel is seen foraging in a forest, and then a person is shown picking up a pineapple. The squirrel continues to forage while the person holds the pineapple.", "gt-answer": "B. A person is picking up a pineapple and then a squirrel is foraging", "rating": 0 }, { "chatgpt-reasoning": "According to the video description, the events occur in the following order: first, a squirrel is seen foraging in the woods, then a person picks up a pineapple, and finally, the squirrel eats the pineapple.", "chatgpt-answer": "C. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "A squirrel is seen foraging in the woods, while a person picks up a pineapple. The squirrel then eats the pineapple.", "gt-answer": "B. A person is picking up a pineapple and then a squirrel is foraging", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that a squirrel is foraging and then a person is picking up a pineapple.", "chatgpt-answer": "C. A squirrel is foraging and then a person is picking up a pineapple", "video-llm-prediction": "A squirrel is foraging and then a person is picking up a pineapple.", "gt-answer": "B. A person is picking up a pineapple and then a squirrel is foraging", "rating": 0 } ] }, "1054717541_1047368344_0": { "order": [ { "chatgpt-reasoning": "The video description clearly states that \"a girl jumps into the water while a person kneads dough\". This implies that the action of the girl jumping into the water and the person kneading dough are happening simultaneously.", "chatgpt-answer": "C. a girl jumping into water while a person kneading dough", "video-llm-prediction": "A girl jumps into the water while a person kneads dough.", "gt-answer": "C. a girl jumping into water while a person kneading dough", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the girl jumping into the water is followed by a person kneading dough. It also mentions that the scene shifts to the person kneading dough with the girl jumping into the water in the background. This indicates that the correct sequence of events in the video is \"a girl jumping into water followed by a person kneading dough.\"", "chatgpt-answer": "A. a girl jumping into water followed by a person kneading dough", "video-llm-prediction": "The video showcases a girl jumping into a body of water, followed by a person kneading dough. The scene then shifts to the person kneading dough, with the girl jumping into the water in the background. The video captures the serene beauty of nature and the joy of simple pleasures.", "gt-answer": "C. a girl jumping into water while a person kneading dough", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that \"A girl jumps into the water while a person kneads dough.\" This indicates that the girl is jumping into the water at the same time as the person is kneading dough.", "chatgpt-answer": "C. a girl jumping into water while a person kneading dough", "video-llm-prediction": "A girl jumps into the water while a person kneads dough.", "gt-answer": "C. a girl jumping into water while a person kneading dough", "rating": 1 }, { "chatgpt-reasoning": "The video description states that \"a girl jumps into the water while a person kneads dough.\" This indicates that the girl's action of jumping into the water happens at the same time as the person kneading dough. Therefore, the correct answer is C.", "chatgpt-answer": "C. a girl jumping into water while a person kneading dough", "video-llm-prediction": "A girl jumps into the water while a person kneads dough.", "gt-answer": "C. a girl jumping into water while a person kneading dough", "rating": 1 } ] }, "1054717541_1047368344_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the person is kneading dough followed by a girl jumping into water.", "chatgpt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "A person is kneading dough followed by a girl jumping into water.", "gt-answer": "A. a person is kneading dough followed by a girl jumping into water", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the sequence of events in the video is \"a person kneading dough, followed by a girl jumping into water.\" This means that first, a person is seen kneading dough, and then a girl jumps into water.", "chatgpt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "The video showcases a person kneading dough, followed by a girl jumping into water. The scene then shifts to a girl running on a dock, followed by a person kneading dough. The video captures the essence of nature and the joy of outdoor activities.", "gt-answer": "A. a person is kneading dough followed by a girl jumping into water", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the person is kneading dough followed by a girl jumping into water. Therefore, option A is the correct answer.", "chatgpt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "A person is kneading dough followed by a girl jumping into water.", "gt-answer": "A. a person is kneading dough followed by a girl jumping into water", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the person is kneading dough followed by a girl jumping into water.", "chatgpt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "A person is kneading dough followed by a girl jumping into water.", "gt-answer": "A. a person is kneading dough followed by a girl jumping into water", "rating": 1 } ] }, "1054717541_1047368344_2": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the sequence of events starts with a girl jumping into water while a person is kneading dough, followed by a man kneading dough in a kitchen.", "chatgpt-answer": "C. a girl jumping into water while a person kneading dough", "video-llm-prediction": "The video starts with a girl jumping into the water while a person is kneading dough. The scene then shifts to a man kneading dough in a kitchen. The man is seen adding flour to the dough and kneading it. The video then shows the man shaping the dough into a ball and placing it on a wooden board. The man then rolls the dough out and cuts it into pieces. The video ends with the man placing the dough on a baking sheet and putting it in the oven. Overall, the video showcases the process of making dough and sh", "gt-answer": "B. a girl jumping into water followed by a person kneading dough", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girl is jumping into water while a person is kneading dough. This indicates that both actions are happening simultaneously.", "chatgpt-answer": "C. a girl jumping into water while a person kneading dough", "video-llm-prediction": "The video showcases a girl jumping into water while a person kneads dough. The video also features a man kneading dough in a kitchen.", "gt-answer": "B. a girl jumping into water followed by a person kneading dough", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that a person is kneading dough followed by a girl jumping into water. This implies a sequential order of events.", "chatgpt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "A person is kneading dough followed by a girl jumping into water.", "gt-answer": "B. a girl jumping into water followed by a person kneading dough", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is kneading dough followed by a girl jumping into water.", "chatgpt-answer": "A. a person is kneading dough followed by a girl jumping into water", "video-llm-prediction": "A person is kneading dough followed by a girl jumping into water.", "gt-answer": "B. a girl jumping into water followed by a person kneading dough", "rating": 0 } ] }, "1089201973_1086820415_0": { "order": [ { "chatgpt-reasoning": "The video description clearly states that \"A person is kicking football and then a big wave is shown\". This indicates that the person kicking the football happens first, followed by the appearance of the big wave.", "chatgpt-answer": "A. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is kicking football and then a big wave is shown.", "gt-answer": "B. The events are shown simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"A person is kicking football and then a big wave is shown\". This indicates that the person first kicks the football and then the big wave is shown.", "chatgpt-answer": "A. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is kicking football and then a big wave is shown.", "gt-answer": "B. The events are shown simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that \"A person is kicking football and then a big wave is shown\", indicating the order of events.", "chatgpt-answer": "A. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is kicking football and then a big wave is shown.", "gt-answer": "B. The events are shown simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"A person is seen kicking a football, and then a big wave is shown.\" This indicates that the person first kicks the football and then the big wave is shown.", "chatgpt-answer": "A. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is seen kicking a football, and then a big wave is shown. The video showcases the person's movements and the wave's impact.", "gt-answer": "B. The events are shown simultaneously", "rating": 0 } ] }, "1089201973_1086820415_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the video starts with a person kicking a football, then a big wave is shown, and finally, the person is seen kicking the football again before the video ends. This means that the correct order of events in the video is \"C. A person is kicking football and then a big wave is shown.\"", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "The video starts with a person kicking a football, and then a big wave is shown. The video then shows the entire video, and the person is seen kicking the football again. The video ends with a big wave being shown.", "gt-answer": "C. A person is kicking football and then a big wave is shown", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the person is kicking a football first and then a big wave is shown. Therefore, the correct answer is option C.", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "The video showcases a person kicking a football, followed by a big wave crashing. The video captures the essence of the game of football and the power of nature's elements. The person's kick is a representation of the game's intensity and the wave's crash symbolizes the game's unpredictability. The video's visuals are breathtaking, and the sound of the waves adds to the immersive experience. Overall, the video is a perfect representation of the game of football and the beauty of nature.", "gt-answer": "C. A person is kicking football and then a big wave is shown", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that first the person is kicking football and then a big wave is shown.", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is kicking football and then a big wave is shown.", "gt-answer": "C. A person is kicking football and then a big wave is shown", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is seen kicking a football, and then a big wave is shown. Therefore, the correct order of events in the video is C. A person is kicking football and then a big wave is shown.", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is seen kicking a football, and then a big wave is shown. The video showcases the power of nature and the beauty of sports.", "gt-answer": "C. A person is kicking football and then a big wave is shown", "rating": 1 } ] }, "1089201973_1086820415_2": { "order": [ { "chatgpt-reasoning": "The video description mentions that the events are shown simultaneously, which means that both events are happening at the same time.", "chatgpt-answer": "B. The events are shown simultaneously", "video-llm-prediction": "The video starts with a big wave shown, and then a person is seen kicking a football. The events are shown simultaneously.", "gt-answer": "A. A big wave is shown and then a person is kicking football", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person is kicking a football on a field, followed by a big wave crashing in the ocean. This indicates that the order of events in the video is that the person is kicking football first and then a big wave is shown.", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown.", "video-llm-prediction": "The video showcases a person kicking a football on a field, followed by a big wave crashing in the ocean. The video captures the beauty of nature and the excitement of sports.", "gt-answer": "A. A big wave is shown and then a person is kicking football", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"a person is seen kicking a football on a field while a big wave is shown in the background.\" This suggests that the person kicking the football comes before the big wave being shown.", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is seen kicking a football on a field while a big wave is shown in the background. The video showcases the beauty of nature and the joy of playing football.", "gt-answer": "A. A big wave is shown and then a person is kicking football", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"A person is seen kicking a football on a field, and then a big wave is shown\". This indicates that first the person is kicking the football and then the big wave is shown.", "chatgpt-answer": "C. A person is kicking football and then a big wave is shown", "video-llm-prediction": "A person is seen kicking a football on a field, and then a big wave is shown. The video showcases the power of the ocean and the excitement of playing football.", "gt-answer": "A. A big wave is shown and then a person is kicking football", "rating": 0 } ] }, "1080990179_1086820415_0": { "order": [ { "chatgpt-reasoning": "The video description mentions that the video starts with a close-up shot of an apple, then transitions to a big wave crashing in the ocean, and ends with the apple drying out. Therefore, the correct order of events is: An apple is drying out and then a big wave is shown.", "chatgpt-answer": "C. An apple is drying out and then a big wave is shown", "video-llm-prediction": "The video starts with a close-up shot of an apple, which then transitions to a big wave crashing in the ocean. The apple is shown drying out, and the wave is shown crashing in the ocean. The video ends with the apple drying out.", "gt-answer": "A. At the same time, an apple is drying out and a big wave is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the process of an apple drying out is showcased, with a big wave being shown in the background. Therefore, the correct order of events in the video is first the big wave is shown, and then the apple is drying out.", "chatgpt-answer": "B. A big wave is shown and then an apple is drying out", "video-llm-prediction": "The video showcases the process of an apple drying out, with a big wave being shown in the background. The apple is seen hanging on a tree and then being left to dry out on a counter. The video also features a close-up shot of the apple, highlighting its texture and color. The drying process is shown in detail, with the apple being left to dry for an extended period. The video ends with a shot of the apple on the counter, emphasizing its transformation from a fresh fruit to a dried one.", "gt-answer": "A. At the same time, an apple is drying out and a big wave is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description states that first, a close-up of an apple is shown, followed by a big wave crashing. Then, the apple is shown drying out. Therefore, the correct order of events in the video is: A big wave is shown and then an apple is drying out.", "chatgpt-answer": "B. A big wave is shown and then an apple is drying out", "video-llm-prediction": "The video shows a close-up of an apple, followed by a big wave crashing. The apple is then shown drying out.", "gt-answer": "A. At the same time, an apple is drying out and a big wave is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the process of an apple drying out is showcased while a big wave is shown in the background. This indicates that first, the apple is drying out and then the big wave is shown.", "chatgpt-answer": "C. An apple is drying out and then a big wave is shown", "video-llm-prediction": "The video showcases the process of an apple drying out while a big wave is shown in the background. The video captures the natural beauty of the apple and the power of the ocean waves.", "gt-answer": "A. At the same time, an apple is drying out and a big wave is shown", "rating": 0 } ] }, "1080990179_1086820415_1": { "order": [ { "chatgpt-reasoning": "The video description mentions that the video starts with a close-up shot of an apple, which then transitions to a big wave crashing. The apple is shown drying out, and the wave is shown crashing at the same time. The video ends with the apple still drying out. Therefore, the correct order of events in the video is that at the same time, an apple is drying out and a big wave is shown.", "chatgpt-answer": "C. At the same time, an apple is drying out and a big wave is shown", "video-llm-prediction": "The video starts with a close-up shot of an apple, which then transitions to a big wave crashing. The apple is shown drying out, and the wave is shown crashing at the same time. The video ends with the apple still drying out.", "gt-answer": "A. An apple is drying out and then a big wave is shown", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video showcases the process of an apple drying out first, and then a big wave is shown. It does not mention that these events are happening simultaneously or in a different order.", "chatgpt-answer": "A. An apple is drying out and then a big wave is shown", "video-llm-prediction": "The video showcases the process of an apple drying out, with a focus on the apple's transformation from fresh to dry. The video also features a big wave, which adds a sense of scale and contrast to the scene. The combination of the apple and the wave creates a visually striking image that captures the viewer's attention.", "gt-answer": "A. An apple is drying out and then a big wave is shown", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the apple is drying out while a big wave is shown in the background. This indicates that the drying of the apple happens first and then the big wave is shown.", "chatgpt-answer": "A. An apple is drying out and then a big wave is shown", "video-llm-prediction": "The video shows an apple drying out while a big wave is shown in the background.", "gt-answer": "A. An apple is drying out and then a big wave is shown", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the video starts with a close-up shot of an apple, then transitions to a shot of the apple drying out. After that, the camera pans out to show the apple in the context of the video. Finally, the video ends with a shot of the apple drying out. There is no mention of a big wave being shown simultaneously or before the apple drying out.", "chatgpt-answer": "A. An apple is drying out and then a big wave is shown", "video-llm-prediction": "The video showcases the process of an apple drying out while a big wave is shown in the background. The video starts with a close-up shot of an apple, which then transitions to a shot of the apple drying out. The camera then pans out to show the apple in the context of the video. The video ends with a shot of the apple drying out.", "gt-answer": "A. An apple is drying out and then a big wave is shown", "rating": 1 } ] }, "1080990179_1086820415_2": { "order": [ { "chatgpt-reasoning": "The video description provides a clear sequence of events. It states that the video starts with a close-up shot of an apple, then transitions to a big wave crashing, and finally shows the apple being cut in half.", "chatgpt-answer": "B. A big wave is shown and then an apple is drying out", "video-llm-prediction": "The video starts with a close-up shot of an apple, which then transitions to a big wave crashing. The video then shows the apple drying out, with the waves crashing in the background. The video ends with the apple being cut in half.", "gt-answer": "B. A big wave is shown and then an apple is drying out", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the video showcases the process of an apple drying out, with a big wave being shown in the background. Therefore, the correct answer is C - \"An apple is drying out and then a big wave is shown.\"", "chatgpt-answer": "C. An apple is drying out and then a big wave is shown.", "video-llm-prediction": "The video showcases the process of an apple drying out, with a big wave being shown in the background. The apple is seen in various stages of drying, from being fresh to being completely dried out. The video also captures the beauty of the ocean, with waves crashing against the shore and the sun shining down on the water. The combination of the apple and the ocean creates a serene and peaceful atmosphere, making the video a perfect representation of the beauty of nature.", "gt-answer": "B. A big wave is shown and then an apple is drying out", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the video starts with a close-up shot of the apple, followed by a shot of the apple drying out. Then, the camera pans out to show the big wave in the background. Finally, the video ends with a shot of the apple again. This indicates that the order of events in the video is option C - An apple is drying out and then a big wave is shown.", "chatgpt-answer": "C. An apple is drying out and then a big wave is shown", "video-llm-prediction": "The video showcases the process of an apple drying out while a big wave is shown in the background. The video starts with a close-up shot of the apple, which is then followed by a shot of the apple drying out. The camera then pans out to show the big wave in the background. The video ends with a shot of the apple again.", "gt-answer": "B. A big wave is shown and then an apple is drying out", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with a close-up shot of the apple, then transitions to a shot of the apple drying out. After that, the camera pans out to show the entire apple, and the drying process continues. Finally, the video ends with a shot of the apple, which is now completely dry. There is no mention of the big wave happening at the same time as the apple drying out, so option A can be eliminated. Therefore, the correct order of events in the video is Option C: An apple is drying out and then a big wave is shown.", "chatgpt-answer": "C. An apple", "video-llm-prediction": "The video showcases the process of an apple drying out while a big wave is shown in the background. The video starts with a close-up shot of the apple, which then transitions to a shot of the apple drying out. The camera then pans out to show the entire apple, and the drying process continues. The video ends with a shot of the apple, which is now completely dry. The video provides a unique perspective on the drying process of an apple, and the big wave in the background adds an element of natural beauty to the video.", "gt-answer": "B. A big wave is shown and then an apple is drying out", "rating": 0 } ] }, "1067268403_1064645467_0": { "order": [ { "chatgpt-reasoning": "Based on the video description, it mentions that the man is doing exercise while wind turbines are rotating in the background. The description lists the actions of the man (stretching exercises, push-ups, pull-ups, squats), and in each case, it is mentioned that the wind turbines are rotating in the sea. Therefore, the correct order of events in the video is that the man is doing exercise followed by wind turbines rotating.", "chatgpt-answer": "B. A man doing exercise followed by wind turbines rotating", "video-llm-prediction": "The video starts with a man doing exercise while wind turbines are rotating in the background. The man is wearing a white shirt and black trousers, and he is doing some stretching exercises. The wind turbines are white in color, and they are rotating in the sea. The man is doing some push-ups, and the wind turbines are rotating in the sea. The man is doing some pull-ups, and the wind turbines are rotating in the sea. The man is doing some squats, and the wind turbines are rotating in the", "gt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is performing exercises in front of a beautiful sunset, and it also mentions that the wind turbines are rotating in the background. It does not specify whether the wind turbines were rotating before or after the man started doing exercises, but it indicates that both events are happening concurrently.", "chatgpt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "The video showcases a man performing exercises in front of a beautiful sunset, with wind turbines rotating in the background. The man is dressed in a white shirt and black pants, and he is seen doing push-ups and stretching his arms. The wind turbines are white and are located in the distance. The sunset is orange and yellow, with the sun setting behind the man. The video captures the serene beauty of nature and the man's dedication to his fitness routine.", "gt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man is seen doing exercise while wind turbines are rotating in the background. This implies that both events are happening simultaneously.", "chatgpt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "A man is seen doing exercise while wind turbines are rotating in the background.", "gt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, it is mentioned that a man is seen doing exercise while wind turbines are rotating in the background. This suggests that the wind turbines are already rotating before the man starts exercising. Therefore, the correct answer is:", "chatgpt-answer": "A. Wind turbines are rotating followed by a man doing exercise", "video-llm-prediction": "A man is seen doing exercise while wind turbines are rotating in the background.", "gt-answer": "C. A man doing exercise and wind turbines rotating concurrently", "rating": 0 } ] }, "1067268403_1064645467_1": { "order": [ { "chatgpt-reasoning": "Based on the video description, the video showcases both a man doing exercise and wind turbines rotating in the background. However, it does not specify the order of events. Therefore, there is not enough information to determine the correct answer.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "The video showcases a man doing exercise in a park while wind turbines are rotating in the background. The man is seen wearing a white shirt and black trousers, and he is doing exercise on a playground. The video also shows a man doing exercise on a playground, and a man doing exercise in a park. The video captures the beauty of nature and the importance of physical activity.", "gt-answer": "C. Wind turbines are rotating followed by a man doing exercise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man's exercise routine is interspersed with the rotating wind turbines, creating a visually appealing and harmonious scene. This implies that the events of the man doing exercise and wind turbines rotating are happening concurrently.", "chatgpt-answer": "A. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "The video showcases a man engaging in physical activity, possibly a workout or exercise routine, while the wind turbines in the background rotate. The man is seen wearing a white shirt and black pants, and he is positioned in front of a blue sky with clouds. The video emphasizes the connection between physical activity and the environment, highlighting the importance of incorporating nature into our daily routines. The man's exercise routine is interspersed with the rotating wind turbines, creating a visually appealing and harmonious scene. The video encourages viewers to appreciate the", "gt-answer": "C. Wind turbines are rotating followed by a man doing exercise", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen doing exercise while wind turbines are rotating in the background. This implies that both events are happening at the same time, so the correct answer is A.", "chatgpt-answer": "A. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "A man is seen doing exercise while wind turbines are rotating in the background. The video showcases the man's physical fitness routine and the beauty of nature.", "gt-answer": "C. Wind turbines are rotating followed by a man doing exercise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is performing exercise while wind turbines rotate in the background. This implies that both events are happening at the same time, therefore the correct answer is A. A man doing exercise and wind turbines rotating concurrently.", "chatgpt-answer": "A. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "The video showcases a man performing exercise while wind turbines rotate in the background. The man is seen wearing a suit and tie, and he is seen doing exercise on a playground. The video also features a man doing exercise on a playground and a man doing exercise on a field. The video captures the man's movements as he performs exercise, and the wind turbines rotate in the background, creating a serene and peaceful atmosphere. The video is a perfect representation of the man's dedication towards his fitness routine, and the wind turbines add a touch of nature to the video", "gt-answer": "C. Wind turbines are rotating followed by a man doing exercise", "rating": 0 } ] }, "1067268403_1064645467_2": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the man is doing exercise first, followed by wind turbines rotating in the background.", "chatgpt-answer": "B. A man doing exercise followed by wind turbines rotating", "video-llm-prediction": "The video shows a man doing exercise in a park, followed by wind turbines rotating in the background. The man continues to exercise while the wind turbines keep rotating.", "gt-answer": "B. A man doing exercise followed by wind turbines rotating", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is performing exercises in a park, while the wind turbines are rotating in the background. Therefore, the order of events in the video is that the wind turbines are rotating followed by the man doing exercise.", "chatgpt-answer": "C. Wind turbines are rotating followed by a man doing exercise", "video-llm-prediction": "The video showcases a man performing exercises in a park, with wind turbines rotating in the background. The man is seen doing push-ups and stretching, while the wind turbines are rotating in the distance. The video captures the man's physical activity and the natural beauty of the park. The wind turbines add a sense of motion and energy to the scene, creating a visually appealing contrast between the man's exercise routine and the surrounding environment. Overall, the video highlights the importance of physical activity and the beauty of nature.", "gt-answer": "B. A man doing exercise followed by wind turbines rotating", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"A man is seen doing exercise while wind turbines are rotating in the background\", indicating that both the man doing exercise and the wind turbines rotating are happening at the same time.", "chatgpt-answer": "A. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "A man is seen doing exercise while wind turbines are rotating in the background. The video showcases the beauty of nature and the importance of physical activity.", "gt-answer": "B. A man doing exercise followed by wind turbines rotating", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen exercising in a park and the wind turbines are rotating concurrently. This implies that both events are happening at the same time.", "chatgpt-answer": "A. A man doing exercise and wind turbines rotating concurrently", "video-llm-prediction": "The video showcases a man engaging in physical activity while the wind turbines rotate in the background. The man is seen exercising in a park, and the wind turbines are rotating concurrently. The video emphasizes the importance of physical activity and the beauty of nature.", "gt-answer": "B. A man doing exercise followed by wind turbines rotating", "rating": 0 } ] }, "1082268005_1063373449_0": { "order": [ { "chatgpt-reasoning": "The video description provides a clear sequence of events. First, the video shows the process of assembling a globe using toy bricks. Then, it shows the process of disassembling the globe using viruses.", "chatgpt-answer": "C. viruses are dissolving and then planet earth is assembling from toy bricks", "video-llm-prediction": "The video showcases the process of assembling a globe using toy bricks and then the process of disassembling it using viruses. The video starts with a white screen displaying the title of the video. The scene then changes to a blue screen displaying the title of the video. The video then shows a globe being assembled using toy bricks. The scene then changes to a white screen displaying the title of the video. The video then shows the process of disassembling the globe using viruses. The scene then changes to a blue screen displaying the title of the video. The video ends with", "gt-answer": "A. The events are happening simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the process of assembling a model of the Earth from toy bricks is showcased first, followed by the disintegration of the model due to viruses. This indicates that the correct sequence is \"planet earth is assembling from toy bricks and then viruses are dissolving.\"", "chatgpt-answer": "B. planet earth is assembling from toy bricks and then viruses are dissolving", "video-llm-prediction": "The video showcases the process of assembling a model of the Earth from toy bricks, followed by the disintegration of the model due to viruses. The video highlights the importance of vaccination and the potential consequences of not getting vaccinated.", "gt-answer": "A. The events are happening simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states the order of events: first, the blue and yellow globe is assembling from toy bricks, and then the bricks are being dissolved by viruses.", "chatgpt-answer": "C. viruses are dissolving and then planet earth is assembling from toy bricks", "video-llm-prediction": "The video shows a blue and yellow globe assembling from toy bricks, and then the bricks are being dissolved by viruses.", "gt-answer": "A. The events are happening simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the process of assembling a globe from toy bricks is followed by the disintegration of the bricks. Then, it transitions to the process of the Earth reassembling from the disintegrated bricks. Therefore, the correct order of events is \"planet earth is assembling from toy bricks and then viruses are dissolving.\"", "chatgpt-answer": "B. planet earth is assembling from toy bricks and then viruses are dissolving.", "video-llm-prediction": "The video showcases the process of assembling a globe from toy bricks, followed by the disintegration of the bricks. The video then transitions to the process of the earth reassembling from the disintegrated bricks.", "gt-answer": "A. The events are happening simultaneously", "rating": 0 } ] }, "1082268005_1063373449_1": { "order": [ { "chatgpt-reasoning": "The video description states that the globe is assembling from toy bricks and simultaneously, the virus is dissolving. This indicates that both events are happening at the same time.", "chatgpt-answer": "C. The events are happening simultaneously", "video-llm-prediction": "The video starts with a close-up shot of a cell, and then it transitions to a shot of a globe. The globe then starts to assemble from toy bricks, and the video shows the process of the assembly. As the globe is assembling, the video shows the process of the virus dissolving. The video then shows the process of the virus dissolving and the globe assembling simultaneously. The video ends with a shot of the globe.", "gt-answer": "A. planet earth is assembling from toy bricks and then viruses are dissolving", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the earth is seen assembling from toy bricks first, followed by the appearance of viruses that begin to dissolve. Therefore, option A is the correct answer.", "chatgpt-answer": "A. planet earth is assembling from toy bricks and then viruses are dissolving", "video-llm-prediction": "The video showcases the process of the earth's formation and the subsequent evolution of viruses. The earth is seen assembling from toy bricks, followed by the appearance of viruses that begin to dissolve. The video then depicts the simultaneous occurrence of these events.", "gt-answer": "A. planet earth is assembling from toy bricks and then viruses are dissolving", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the events of assembling planet earth from toy bricks and dissolving viruses are happening simultaneously.", "chatgpt-answer": "C. The events are happening simultaneously", "video-llm-prediction": "The video shows a planet earth assembling from toy bricks and then viruses are dissolving. The events are happening simultaneously.", "gt-answer": "A. planet earth is assembling from toy bricks and then viruses are dissolving", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the process of the earth's formation from toy bricks is showcased first, followed by the subsequent dissolving of viruses. It also highlights that these events are happening simultaneously.", "chatgpt-answer": "C. The events are happening simultaneously", "video-llm-prediction": "The video showcases the process of the earth's formation from toy bricks and the subsequent dissolving of viruses. The video also highlights the simultaneous occurrence of these events.", "gt-answer": "A. planet earth is assembling from toy bricks and then viruses are dissolving", "rating": 0 } ] }, "1082268005_1063373449_2": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the events of a virus dissolving and the assembly of the planet earth from toy bricks are happening simultaneously.", "chatgpt-answer": "B. The events are happening simultaneously", "video-llm-prediction": "The video showcases the process of a virus dissolving and then the assembly of the planet earth from toy bricks. The video also depicts the events happening simultaneously.", "gt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the order of events is as follows: first, the virus is dissolving, and then the earth is assembled from toy bricks. The video ends with the earth being assembled from toy bricks.", "chatgpt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "video-llm-prediction": "The video showcases the process of a virus dissolving and the subsequent assembly of the earth from toy bricks. The video starts with the virus dissolving, and then the earth is assembled from toy bricks. The video then shows the earth being assembled from toy bricks, and then the virus is dissolving. The video ends with the earth being assembled from toy bricks.", "gt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the process of a virus breaking down and the earth assembling from toy bricks is happening simultaneously, which means that neither one happens before the other.", "chatgpt-answer": "B. The events are happening simultaneously", "video-llm-prediction": "The video shows the process of a virus breaking down and the earth assembling from toy bricks. The video also shows the process happening simultaneously.", "gt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with a close-up of a virus, which then leads to the assembly of the earth model. It then shows the virus breaking down and ends with the earth model being shown again. This indicates that the order of events in the video is viruses dissolving first and then planet earth assembling from toy bricks.", "chatgpt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "video-llm-prediction": "The video showcases the process of a virus breaking down and the assembly of a toy model of the earth. The video starts with a close-up of a virus, which then leads to the assembly of the earth model. The video then shows the virus breaking down, and the earth model is shown again. The video ends with the earth model being shown again.", "gt-answer": "A. viruses are dissolving and then planet earth is assembling from toy bricks", "rating": 1 } ] }, "1060403198_1049965795_0": { "order": [ { "chatgpt-reasoning": "The video description mentions that a light bulb is shown lighting up, followed by a tree growing up. Then it shows the tree growing up and a light bulb lighting up at the same time. This indicates that the correct answer is that both events happen at the same time.", "chatgpt-answer": "C. Both events happen at the same time", "video-llm-prediction": "A light bulb is shown lighting up, followed by a tree growing up. The video then shows the tree growing up and a light bulb lighting up at the same time.", "gt-answer": "C. Both events happen at the same time", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with a close-up shot of a light bulb, then transitions to a tree growing up while the light bulb is lighting up. It ends with a close-up shot of the light bulb. This indicates that the light bulb is lighting up before the tree starts growing up.", "chatgpt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "The video showcases a tree growing up while a light bulb is lighting up. The video starts with a close-up shot of a light bulb, and then it transitions to a tree growing up. The video then shows the tree growing up while the light bulb is lighting up. The video ends with a close-up shot of the light bulb. The video captures the growth of the tree and the lighting up of the light bulb, creating a visually appealing scene.", "gt-answer": "C. Both events happen at the same time", "rating": 0 }, { "chatgpt-reasoning": "According to the video description, it first mentions that a light bulb is lighting up and then states that the tree is growing up. This implies that the events happen in sequence with the light bulb lighting up first and then the tree growing up.", "chatgpt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A light bulb is lighting up and then the tree is growing up.", "gt-answer": "C. Both events happen at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the light bulb is seen lighting up first, followed by the tree growing up. This indicates a sequential order of events.", "chatgpt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A light bulb is seen lighting up, followed by a tree growing up. The video showcases the growth of the tree, with the light bulb providing a source of light. The video captures the beauty of nature and the power of light.", "gt-answer": "C. Both events happen at the same time", "rating": 0 } ] }, "1060403198_1049965795_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the tree is growing up first, and then a light bulb is shown lighting up. This sequence is repeated twice, with the tree growing up first followed by the light bulb lighting up. Therefore, the correct answer is A. The tree is growing up and then a light bulb is lighting up.", "chatgpt-answer": "A. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "The video starts with a tree growing up, and then a light bulb is shown lighting up. The video then shows the tree growing up again, and the light bulb is shown lighting up again. The video ends with the tree growing up and the light bulb lighting up.", "gt-answer": "A. The tree is growing up and then a light bulb is lighting up", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the tree is growing up first, and then the light bulb is lighting up. It also mentions a close-up shot of the light bulb, indicating that the focus shifts from the tree to the light bulb.", "chatgpt-answer": "A. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "The video showcases a tree growing up and then a light bulb lighting up. The video also features a close-up shot of the light bulb.", "gt-answer": "A. The tree is growing up and then a light bulb is lighting up", "rating": 1 }, { "chatgpt-reasoning": "The video description states that first a light bulb is shown in the video, and then a tree is shown growing up. This indicates that the events happen sequentially, with the light bulb lighting up before the tree grows up.", "chatgpt-answer": "C. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A light bulb is shown in the video, and then a tree is shown growing up.", "gt-answer": "A. The tree is growing up and then a light bulb is lighting up", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the tree is growing up first and then a light bulb is lighting up. There is no mention of both events happening at the same time or the light bulb lighting up first before the tree grows.", "chatgpt-answer": "A. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "The video showcases a tree growing up and then a light bulb lighting up. The video also features a close-up of the light bulb.", "gt-answer": "A. The tree is growing up and then a light bulb is lighting up", "rating": 1 } ] }, "1060403198_1049965795_2": { "order": [ { "chatgpt-reasoning": "The video description mentions that the video starts with a close-up shot of a light bulb being lit up, followed by a shot of a tree growing up. Then it shows the tree growing up and the light bulb being lit up simultaneously. The video ends with the tree growing up. Therefore, the correct order of events in the video is that the light bulb is lighting up and then the tree is growing up.", "chatgpt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "The video starts with a close-up shot of a light bulb being lit up, followed by a shot of a tree growing up. The video then shows the tree growing up and the light bulb being lit up simultaneously. The video ends with the tree growing up.", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the tree is seen growing up in the beginning, and then the light bulb is shown lighting up. This indicates that the tree growing up happens before the light bulb lighting up.", "chatgpt-answer": "B. The tree is growing up and then a light bulb is lighting up", "video-llm-prediction": "The video showcases a tree growing up while a light bulb is lighting up. The tree is seen growing up in the beginning, and then the light bulb is shown lighting up. The video captures the growth of the tree and the lighting up of the bulb simultaneously.", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the light bulb is lighting up first, followed by the tree growing up.", "chatgpt-answer": "A. A light bulb is lighting up and then the tree is growing up", "video-llm-prediction": "A light bulb is lighting up and then the tree is growing up.", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the light bulb is lighting up first, followed by the tree growing up. Therefore, the correct answer is A. A light bulb is lighting up and then the tree is growing up.", "chatgpt-answer": "A. A light bulb is lighting up and then the tree is growing up.", "video-llm-prediction": "A light bulb is lighting up, and then the tree is growing up. The video showcases the growth of a tree, starting from a small sapling to a full-grown tree. The light bulb's illumination adds a touch of magic to the scene, emphasizing the tree's growth. The video captures the beauty of nature and the process of growth, making it an excellent visual representation of the passage of time.", "gt-answer": "A. A light bulb is lighting up and then the tree is growing up", "rating": 1 } ] }, "1091143117_1094219575_0": { "order": [ { "chatgpt-reasoning": "The video description mentions that the video starts with an eye opening, followed by a flower wilting. Then, it shows the wilting flower and the eye opening simultaneously. Finally, the video ends with the flower wilting. Based on this information, we can conclude that the correct order of events in the video is option A.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video starts with an eye opening, and then a flower wilting. The video then shows the wilting flower, and the eye opening simultaneously. The video ends with the flower wilting.", "gt-answer": "C. Both events happen simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the opening of the eye is the first event to occur, followed by the wilting of the flower. It also mentions that the video provides a visual representation of these two events happening simultaneously. Therefore, the correct answer is:", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting.", "video-llm-prediction": "The video showcases the opening of an eye and the wilting of a flower. The opening of the eye is the first event to occur, followed by the wilting of the flower. The video provides a visual representation of these two events happening simultaneously.", "gt-answer": "C. Both events happen simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description states that both the flower wilting and the eye opening are happening simultaneously.", "chatgpt-answer": "C. Both events happen simultaneously", "video-llm-prediction": "The video shows a flower wilting and an eye opening simultaneously.", "gt-answer": "C. Both events happen simultaneously", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the opening of the eye is the first event, followed by the wilting of the flower. This implies that the eye is opening first, and then the flower is wilting.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video showcases the opening of an eye and the wilting of a flower simultaneously. The opening of the eye is the first event, followed by the wilting of the flower.", "gt-answer": "C. Both events happen simultaneously", "rating": 0 } ] }, "1091143117_1094219575_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the eye opening is shown first, followed by the wilting of the flower. There is no mention of the events happening simultaneously or the flower wilting before the eye opens.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video starts with an eye opening, and then a flower wilting. The video then shows the flower wilting first, and then the eye opening.", "gt-answer": "A. An eye is opening first, then a flower is wilting", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with an eye opening and then a flower wilting. It specifically mentions the order in which the events occur.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video starts with an eye opening, and then a flower wilting. The video showcases the process of a flower wilting, highlighting the natural aging process of flowers. The camera captures the wilting process from different angles, providing a detailed view of the flower's decline. The video emphasizes the beauty of the flower in its prime and the inevitable decline of all things. The video is a reminder of the fleeting nature of life and the importance of cherishing the moments.", "gt-answer": "A. An eye is opening first, then a flower is wilting", "rating": 1 }, { "chatgpt-reasoning": "The video description states that both the wilting of the flower and the opening of an eye are happening simultaneously.", "chatgpt-answer": "B. Both events happen simultaneously", "video-llm-prediction": "The video shows a wilting flower and an eye opening simultaneously.", "gt-answer": "A. An eye is opening first, then a flower is wilting", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with an eye opening, followed by a flower wilting. It then shows the flower wilting first, and then the eye opening. Therefore, the correct answer is option A.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video starts with an eye opening, followed by a flower wilting. The video then shows the flower wilting first, and then the eye opening. The video captures the natural process of a flower wilting and the opening of an eye, showcasing the beauty of nature.", "gt-answer": "A. An eye is opening first, then a flower is wilting", "rating": 1 } ] }, "1091143117_1094219575_2": { "order": [ { "chatgpt-reasoning": "The video description explicitly states that the video showcases a close-up of a flower wilting, followed by an eye opening. Therefore, the correct order of events in the video is C. A flower is wilting first, then an eye is opening.", "chatgpt-answer": "C. A flower is wilting first, then an eye is opening", "video-llm-prediction": "The video showcases a close-up of a flower wilting, followed by an eye opening. The video emphasizes the beauty of the flower and the delicate nature of life. The wilting of the flower symbolizes the impermanence of all things, while the opening of the eye represents the beauty of life and the importance of appreciating the small things. The video is a reminder to cherish the moments and appreciate the beauty of life.", "gt-answer": "C. A flower is wilting first, then an eye is opening", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the eye opening symbolizes the beginning of a new day, while the wilting flower represents the end of a day. It also states that both events happen simultaneously. This implies that the correct answer should be the one where both events happen at the same time.", "chatgpt-answer": "B. Both events happen simultaneously", "video-llm-prediction": "The video begins with an eye opening, and then a flower wilting. The video showcases the beauty of nature and the delicate balance of life. The eye opening could symbolize the beginning of a new day, while the wilting flower represents the end of a day. The video captures the fleeting nature of life and the beauty of the world around us. The eye opening and wilting flower are both natural events that happen simultaneously, and the video showcases the beauty of both. The video is a reminder of the beauty of the world around us and the importance of appreciating it.", "gt-answer": "C. A flower is wilting first, then an eye is opening", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the eye opening happens first, followed by the flower wilting.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video starts with an eye opening, and then a flower wilting. The video showcases the beauty of nature and the passage of time.", "gt-answer": "C. A flower is wilting first, then an eye is opening", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video starts with an eye opening, and then a flower wilting.", "chatgpt-answer": "A. An eye is opening first, then a flower is wilting", "video-llm-prediction": "The video starts with an eye opening, and then a flower wilting. The video showcases the beauty of nature and the delicate balance of life. The eye opening could symbolize the beginning of a new day, while the wilting flower represents the end of a day. The video captures the fleeting nature of life and the beauty of the world around us.", "gt-answer": "C. A flower is wilting first, then an eye is opening", "rating": 0 } ] }, "1086105089_1085910917_0": { "order": [ { "chatgpt-reasoning": "The video description states that the woman is drinking water while a building is being constructed in the background. This indicates that the construction of the building is happening before the woman starts drinking water.", "chatgpt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "The video shows a woman drinking water while a building is being constructed in the background.", "gt-answer": "C. Both events happen simultaneously.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video showcases the construction of a building first, and then it shows a woman drinking water. It mentions that the woman's actions are a reminder of the importance of staying hydrated during physical activities, which implies that the construction is happening before the woman starts drinking water.", "chatgpt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "The video showcases the construction of a building while a woman drinks water. The woman is seen holding a glass of water and drinking it while the building is being constructed in the background. The video captures the contrast between the woman's peaceful activity and the hustle and bustle of the construction site. The woman's actions are a reminder of the importance of staying hydrated, especially during physical activities. The video highlights the beauty of nature and the importance of preserving it. The woman's actions are a reminder of the importance of staying hydrated, especially during", "gt-answer": "C. Both events happen simultaneously.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is drinking water \"while\" a building is being constructed in the background. This implies that the woman drinking water and the construction of the building are happening at the same time.", "chatgpt-answer": "C. Both events happen simultaneously.", "video-llm-prediction": "A woman drinks water while a building is being constructed in the background.", "gt-answer": "C. Both events happen simultaneously.", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is drinking water first, and then the building is being constructed in the background. Therefore, the correct order of events is that first, a woman is drinking water; then, a building is being constructed.", "chatgpt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "The video showcases a woman drinking water while a building is being constructed in the background. The woman takes a sip of water and sets the glass down on the counter. The video emphasizes the importance of staying hydrated, especially during physical activities or hot weather. The building being constructed in the background adds a sense of progress and development, highlighting the importance of hard work and dedication. Overall, the video serves as a reminder to stay hydrated and work hard towards achieving our goals.", "gt-answer": "C. Both events happen simultaneously.", "rating": 0 } ] }, "1086105089_1085910917_1": { "order": [ { "chatgpt-reasoning": "The video description clearly mentions that the video starts with a woman drinking water and then shows a building being constructed. It states that the woman is enjoying her drink while the building is being built. Therefore, the correct answer is C. First, a woman is drinking water; then, a building is being constructed.", "chatgpt-answer": "C. First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "The video starts with a woman drinking water, and then it shows a building being constructed. The woman seems to be enjoying her drink while the building is being built. The video seems to be showcasing the contrast between the woman's simple act of drinking water and the complex process of building a building. The video highlights the importance of staying hydrated and the beauty of architecture.", "gt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"The woman is seen holding a glass of water and taking a sip, while the building is being built.\" This indicates that first the building is being constructed, and then the woman is drinking water.", "chatgpt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "video-llm-prediction": "The video showcases a woman drinking water while a building is being constructed in the background. The woman is seen holding a glass of water and taking a sip, while the building is being built. The video captures the serene and peaceful atmosphere of the scene, with the sound of the water being the only audible noise. The woman's actions are simple yet powerful, as she takes a moment to drink water and rehydrate herself. The video is a reminder of the importance of staying hydrated, especially in hot weather or during physical activity. The building in the background adds a sense of", "gt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that a woman is seen drinking water while a building is being constructed in the background. This implies that the events are happening simultaneously.", "chatgpt-answer": "B. Both events happen simultaneously.", "video-llm-prediction": "A woman is seen drinking water while a building is being constructed in the background.", "gt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that there is a woman drinking water \"while\" a building is being constructed in the background. This implies that the construction of the building is happening concurrently with the woman drinking water.", "chatgpt-answer": "B. Both events happen simultaneously.", "video-llm-prediction": "A woman is seen drinking water while a building is being constructed in the background.", "gt-answer": "A. First, a building is being constructed; then, a woman is drinking water.", "rating": 0 } ] }, "1086105089_1085910917_2": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the woman is seen drinking water while a building is being constructed in the background. This implies that the event of the woman drinking water happens first, followed by the event of the building being constructed.", "chatgpt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "The video shows a woman drinking water while a building is being constructed in the background. The woman is seen holding a glass of water and taking a sip. The video also shows the building being constructed, with a crane visible in the background. The woman seems to be enjoying her drink while the construction work continues. The video captures the contrast between the woman's peaceful activity and the bustling construction work happening in the background. Overall, the video provides a glimpse into the daily life of a woman in a city where construction work is a common sight.", "gt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is seen holding a glass of water and taking a sip, while the building is being constructed in the background. This indicates that the woman drinking water happens before the building construction.", "chatgpt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "video-llm-prediction": "The video showcases the construction of a building while a woman drinks water. The woman is seen holding a glass of water and taking a sip, while the building is being constructed in the background. The video captures the contrast between the woman's simple action of drinking water and the complex process of building a structure. The video highlights the importance of staying hydrated, especially during physical activities or hot weather. The video also emphasizes the significance of construction and the efforts required to build a structure. Overall, the video is a visual representation of the importance of staying hydrated and the significance of", "gt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the woman is drinking water \"while\" a building is being constructed. This implies that both events are happening at the same time.", "chatgpt-answer": "C. Both events happen simultaneously.", "video-llm-prediction": "A woman drinks water while a building is being constructed.", "gt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"A woman is seen drinking water while a building is being constructed in the background.\" This indicates that the events are happening simultaneously.", "chatgpt-answer": "C. Both events happen simultaneously.", "video-llm-prediction": "A woman is seen drinking water while a building is being constructed in the background.", "gt-answer": "B. First, a woman is drinking water; then, a building is being constructed.", "rating": 0 } ] }, "1034736653_1043054206_0": { "order": [ { "chatgpt-reasoning": "The video description states that the women running and the cars racing are happening simultaneously.", "chatgpt-answer": "B. They happen simultaneously", "video-llm-prediction": "The video shows a group of women running on a track, followed by cars racing on the same track. The video captures the women running and the cars racing simultaneously.", "gt-answer": "B. They happen simultaneously", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the video captures the women running and the cars racing simultaneously.", "chatgpt-answer": "B. They happen simultaneously", "video-llm-prediction": "The video showcases a group of women running on a track, followed by cars racing on the same track. The video captures the women running and the cars racing simultaneously, creating a visually stunning scene. The video highlights the beauty of the track and the athleticism of the women running. The cars racing add an element of excitement and speed to the video, making it a thrilling watch. Overall, the video is a captivating display of athleticism and speed, with the women running and the cars racing creating a visually stunning scene.", "gt-answer": "B. They happen simultaneously", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the women are seen running in a line, with one woman leading the pack and the cars racing on the side of the track, with some cars passing by the women. This indicates that the women start running first, followed by the cars racing.", "chatgpt-answer": "A. Women running, then cars racing", "video-llm-prediction": "The video shows a group of women running on a track while cars race on the side. The women are seen running in the same direction as the cars. The video captures the women running in a line, with one woman leading the pack. The cars are seen racing on the side of the track, with some cars passing by the women. The video ends with the women still running on the track.", "gt-answer": "B. They happen simultaneously", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the events showcased in the video are the women running on a track followed by a scene of cars racing on the same track. Therefore, the correct order of events in the video is Women running, then cars racing.", "chatgpt-answer": "A. Women running, then cars racing", "video-llm-prediction": "The video showcases a group of women running on a track, followed by a scene of cars racing on the same track. The video captures the women's athleticism and the cars' speed and agility. The video emphasizes the contrast between the women's running and the cars' racing, highlighting the different speeds and movements. The video's purpose is to showcase the women's running skills and the cars' racing skills, and it does so effectively.", "gt-answer": "B. They happen simultaneously", "rating": 0 } ] }, "1034736653_1043054206_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the video starts with a woman running on a track, followed by several other women running. Then, it shifts to cars racing on a highway. Afterward, it shows the women running again, followed by the cars racing. Finally, the video ends with the women running again. The events occur in the order of Women running, then cars racing.", "chatgpt-answer": "B. Women running, then cars racing", "video-llm-prediction": "The video starts with a woman running on a track, followed by several other women running. The scene then shifts to cars racing on a highway. The video then shows the women running again, followed by the cars racing. The video ends with the women running again. The video showcases the beauty of nature and the excitement of racing. The video is a perfect blend of nature and technology, making it a must-watch for all car enthusiasts.", "gt-answer": "B. Women running, then cars racing", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the women's running and the cars' racing are happening simultaneously.", "chatgpt-answer": "C. They happen simultaneously", "video-llm-prediction": "The video showcases a group of women running on a track, followed by a scene of cars racing on the same track. The video captures the energy and excitement of both activities, with the women's running and the cars' racing happening simultaneously. The video highlights the beauty of nature, with the track surrounded by mountains and trees. The video also features a yellow sports car driving on a highway, adding to the overall sense of adventure and excitement.", "gt-answer": "B. Women running, then cars racing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the video captures the women running and the cars racing simultaneously.", "chatgpt-answer": "C. They happen simultaneously", "video-llm-prediction": "The video shows a group of women running on a track while cars race on the road beside them. The video captures the women running and the cars racing simultaneously.", "gt-answer": "B. Women running, then cars racing", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the events of women running and cars racing down a highway happen simultaneously.", "chatgpt-answer": "C. They happen simultaneously", "video-llm-prediction": "The video showcases a group of women running on a track, followed by a scene of cars racing down a highway. The two events are shown to happen simultaneously, creating a sense of speed and excitement. The video captures the energy and athleticism of both the runners and the drivers, as they push themselves to the limit. The women's determination and focus are evident as they race towards the finish line, while the cars' power and agility are on full display as they navigate the highways. Overall, the video is a thrilling display of physical prowess and the power of human achievement.", "gt-answer": "B. Women running, then cars racing", "rating": 0 } ] }, "1034736653_1043054206_2": { "order": [ { "chatgpt-reasoning": "The video description mentions that the video starts with a yellow sports car driving down a highway, followed by a group of women running on a track. This indicates that the order of events is cars racing, then women running.", "chatgpt-answer": "C. Cars racing, then women running", "video-llm-prediction": "The video starts with a yellow sports car driving down a highway, followed by a group of women running on a track. The women are seen running in slow motion, and the video captures their movements in detail. The scene then shifts to a group of cars racing down the same highway, with the women running alongside them. The video captures the excitement and energy of both the car race and the women's run, showcasing the beauty of nature and the thrill of competition.", "gt-answer": "C. Cars racing, then women running", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the women are running and jumping into a pile of sand, while the cars race by. This suggests that the women running event happens before the cars racing event.", "chatgpt-answer": "B. Women running, then cars racing", "video-llm-prediction": "The video showcases a group of women running on a track, followed by cars racing on the same track. The video captures the women running and jumping into a pile of sand, while the cars race by. The video also shows the women running on a track with a car driving by. Overall, the video highlights the women's athletic abilities and the cars' speed and agility.", "gt-answer": "C. Cars racing, then women running", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the group of women is running on a track, followed by a race between two cars. This indicates that the events occur in the order of women running first and then cars racing.", "chatgpt-answer": "B. Women running, then cars racing", "video-llm-prediction": "The video shows a group of women running on a track, followed by a race between two cars. The video captures the excitement and energy of the race, with the women running with determination and the cars speeding around the track. The video also showcases the beauty of the surrounding landscape, with the track surrounded by lush greenery and stunning views. Overall, the video is a thrilling and visually stunning display of athleticism and speed.", "gt-answer": "C. Cars racing, then women running", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the women running and the cars racing occur simultaneously.", "chatgpt-answer": "A. They happen simultaneously", "video-llm-prediction": "The video showcases a group of women running on a track, followed by cars racing on the same track. The video captures the women running and the cars racing simultaneously, creating a visually appealing scene. The video highlights the women's athleticism and the cars' speed and agility. The video's focus is on the women's running and the cars' racing, creating a sense of excitement and energy.", "gt-answer": "C. Cars racing, then women running", "rating": 0 } ] }, "1086423566_1094782389_0": { "order": [ { "chatgpt-reasoning": "The video description states that the dog is giving a high five to a woman first, and then the woman adds food into a bowl. This implies that the correct chronological order of events is: A dog is giving a high five to a woman, and then foods are added into a bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then the woman adds food into a bowl. The dog is seen eating the food from the bowl.", "gt-answer": "B. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the dog gives a high five first, followed by adding food into a bowl, and then the woman feeds the dog.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The woman then feeds the dog with the food.", "gt-answer": "B. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that first, a dog is giving a high five to a woman, and then foods are added into a bowl. Therefore, the correct chronological order of the events in the video is: A dog is giving a high five to a woman, and then foods are added into a bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl.", "gt-answer": "B. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dog is seen giving a high five to a woman, and then foods are added into a bowl. This indicates that the correct chronological order of events in the video is for the dog to give a high five first, followed by the addition of food into the bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The video showcases the woman preparing a meal for her dog, and the dog is excited to receive the meal. The video is a heartwarming display of the bond between a dog and its owner.", "gt-answer": "B. Foods are added into a bowl, while at the same time a dog is giving a high five to a woman", "rating": 0 } ] }, "1086423566_1094782389_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the dog first gives a high five to a woman, and then foods are added into a bowl. The last event mentioned is that the dog is seen eating the food from the bowl. So the correct chronological order of events is A. A dog is giving a high five to a woman, and then foods are added into a bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The dog is then seen eating the food from the bowl.", "gt-answer": "C. Foods are added into a bowl, and then a dog is giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the correct chronological order of events in the video is as follows: First, a dog is seen giving a high five to a woman. Then, foods are added into a bowl. Finally, the woman feeds the dog with a spoon and the dog licks the spoon.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The woman then feeds the dog with a spoon, and the dog licks the spoon. The video showcases a heartwarming moment between a dog and its owner.", "gt-answer": "C. Foods are added into a bowl, and then a dog is giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the dog is seen giving a high five to a woman first, and then foods are added into a bowl. Finally, the dog is seen eating the food. This indicates that the correct chronological order of events in the video is: A dog is giving a high five to a woman, and then foods are added into a bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The dog is then seen eating the food.", "gt-answer": "C. Foods are added into a bowl, and then a dog is giving a high five to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the dog is seen giving a high five to a woman first, and then foods are added into a bowl. Finally, the woman feeds the dog with a spoon. Therefore, the correct chronological order of events in the video is: A dog is giving a high five to a woman, and then foods are added into a bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The woman then feeds the dog with a spoon.", "gt-answer": "C. Foods are added into a bowl, and then a dog is giving a high five to a woman", "rating": 0 } ] }, "1086423566_1094782389_2": { "order": [ { "chatgpt-reasoning": "The video description states that the dog is giving a high five to a woman first, followed by adding foods into a bowl, and then the woman mixing the foods in the bowl. Therefore, option A is the correct chronological order.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The woman then proceeds to mix the foods in the bowl.", "gt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the dog gives a high five to a woman first, then foods are added into a bowl, and finally the woman mixes the foods in the bowl. Therefore, the correct chronological order is A.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is giving a high five to a woman, and then foods are added into a bowl. The woman then mixes the foods in the bowl.", "gt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that first, a dog is seen giving a high five to a woman, and then foods are added into a bowl. Finally, the woman mixes the foods in the bowl. Therefore, the correct chronological order of the events in the video is A.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The woman then mixes the foods in the bowl.", "gt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, the correct chronological order of events is that the dog is seen giving a high five to a woman first, and then foods are added into a bowl. This order implies that the action of giving a high five comes before the action of adding food to the bowl.", "chatgpt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "video-llm-prediction": "A dog is seen giving a high five to a woman, and then foods are added into a bowl. The video showcases the process of making a healthy and delicious meal.", "gt-answer": "A. A dog is giving a high five to a woman, and then foods are added into a bowl", "rating": 1 } ] }, "1053758117_1055413730_0": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the digital brain is spinning first, followed by the earth spinning. Therefore, the correct answer is A. The digital brain is spinning and then the earth is spinning.", "chatgpt-answer": "A. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "The video showcases a digital brain spinning, followed by the earth spinning. The video then displays the earth spinning while the digital brain is spinning.", "gt-answer": "B. Both events occur at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the digital brain is spinning first, followed by the earth spinning.", "chatgpt-answer": "A. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "The video showcases a digital brain spinning, followed by the earth spinning. The video emphasizes the interconnectedness of the digital and natural worlds.", "gt-answer": "B. Both events occur at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the digital brain is spinning followed by the earth spinning. Therefore, the correct answer is option A.", "chatgpt-answer": "A. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "The video shows a digital brain spinning, followed by the earth spinning. The video emphasizes the connection between the digital brain and the earth's rotation.", "gt-answer": "B. Both events occur at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that first the digital brain is spinning, followed by the earth spinning.", "chatgpt-answer": "A. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "The video showcases a digital brain spinning, followed by the earth spinning. The video highlights the interconnectedness of the digital and physical worlds.", "gt-answer": "B. Both events occur at the same time", "rating": 0 } ] }, "1053758117_1055413730_1": { "order": [ { "chatgpt-reasoning": "The video description mentions that the digital brain is spinning first and then the earth is spinning. It also states that there is a large explosion and a large light in the sky, which are not mentioned in any other choices.", "chatgpt-answer": "C. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "The video shows a digital brain spinning and then the earth spinning. The video also shows a large explosion and a large light in the sky.", "gt-answer": "C. The digital brain is spinning and then the earth is spinning.", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically states that the earth is spinning first, followed by the digital brain spinning faster than the earth.", "chatgpt-answer": "A. The earth is spinning and then the digital brain is spinning.", "video-llm-prediction": "The video showcases the rotation of the earth and the digital brain, with the latter spinning faster than the former. The video also features a spinning digital brain, which spins faster than the earth.", "gt-answer": "C. The digital brain is spinning and then the earth is spinning.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"The video shows the earth spinning and then the digital brain spinning\", indicating a sequential order of events.", "chatgpt-answer": "A. The earth is spinning and then the digital brain is spinning.", "video-llm-prediction": "The video shows the earth spinning and then the digital brain spinning.", "gt-answer": "C. The digital brain is spinning and then the earth is spinning.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that \"The earth is seen spinning first, followed by the digital brain spinning.\"", "chatgpt-answer": "A. The earth is spinning and then the digital brain is spinning.", "video-llm-prediction": "The video showcases the spinning of the earth and the digital brain. The earth is seen spinning first, followed by the digital brain spinning. The video captures the beauty of the earth and the complexity of the digital brain.", "gt-answer": "C. The digital brain is spinning and then the earth is spinning.", "rating": 0 } ] }, "1053758117_1055413730_2": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the video begins with a spinning digital brain, followed by a spinning earth. Then, it shows a series of digital brains spinning and a series of spinning planets. Finally, the video ends with a spinning digital brain.", "chatgpt-answer": "B. The digital brain is spinning and then the earth is spinning.", "video-llm-prediction": "The video begins with a spinning digital brain, which then transitions to a spinning earth. The video then shows a series of digital brains spinning, followed by a series of spinning planets. The video ends with a spinning digital brain.", "gt-answer": "C. The earth is spinning and then the digital brain is spinning.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that both the digital brain and the earth are spinning in sync with each other, implying that the events occur at the same time.", "chatgpt-answer": "A. Both events occur at the same time", "video-llm-prediction": "The video showcases a spinning digital brain and a spinning earth, both of which are in sync with each other. The video also features a spinning globe, which is a common symbol of the earth. The video's focus is on the relationship between the earth and the digital brain, with the earth spinning and the digital brain spinning in harmony.", "gt-answer": "C. The earth is spinning and then the digital brain is spinning.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the earth is shown spinning first, and then the digital brain is shown spinning. This indicates a clear sequential order of events.", "chatgpt-answer": "C. The earth is spinning and then the digital brain is spinning.", "video-llm-prediction": "The video shows a spinning earth and a spinning digital brain. The earth is shown spinning first, and then the digital brain is shown spinning.", "gt-answer": "C. The earth is spinning and then the digital brain is spinning.", "rating": 1 }, { "chatgpt-reasoning": "The video description states that both the spinning digital brain and the spinning earth are happening simultaneously.", "chatgpt-answer": "A. Both events occur at the same time", "video-llm-prediction": "The video showcases a spinning digital brain and a spinning earth, both spinning simultaneously.", "gt-answer": "C. The earth is spinning and then the digital brain is spinning.", "rating": 0 } ] }, "1076877854_1073914229_0": { "order": [ { "chatgpt-reasoning": "The video description states that the train passes by a field of crops while robotic arms work in the background, and then transitions to the robotic arms working in the field of crops. Therefore, the correct order of events is that the trains are driving first, followed by the robotic arms working.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases a train passing by a field of crops while robotic arms work in the background. The video then transitions to the robotic arms working in the field of crops.", "gt-answer": "B. they happen at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the train passes by a field of green plants first, then there is a demonstration of robotic arms working in a factory, and finally, it transitions back to the train driving down the tracks. So the correct order of events is: trains are driving, then robotic arms are working.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases a train passing by a field of green plants, followed by a demonstration of robotic arms working in a factory. The video then transitions back to the train driving down the tracks.", "gt-answer": "B. they happen at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the train is passing by a field of crops while robotic arms work in the background. Then, it mentions that the video shows the robotic arms working on the crops. This suggests that the order of events is first the train passing by, followed by the robotic arms working on the crops.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video shows a train passing by a field of crops while robotic arms work in the background. The video then shows the robotic arms working on the crops.", "gt-answer": "B. they happen at the same time", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the trains are seen driving through the countryside first, showcasing the beauty of nature. Then, it mentions that the robotic arms are working in a factory, highlighting their efficiency and precision. Therefore, the correct order of events in the video is: trains are driving, then robotic arms are working.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases the harmonious coexistence of trains and robotic arms in a serene environment. The trains are seen driving through the countryside, while the robotic arms are working in a factory. The video highlights the efficiency and precision of the robotic arms in performing their tasks. The trains are seen driving through the countryside, showcasing the beauty of nature. The video emphasizes the importance of balance and harmony between technology and nature.", "gt-answer": "B. they happen at the same time", "rating": 0 } ] }, "1076877854_1073914229_1": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the events occur in a specific order. It starts with a train driving through a field of green plants, followed by a scene of robotic arms working in a factory. Then, the video transitions back to the field, where the train is seen driving again. Therefore, the correct answer is:", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases the efficiency of modern technology in agriculture. It starts with a train driving through a field of green plants, followed by a scene of robotic arms working in a factory. The video then transitions back to the field, where the train is seen driving again. The video highlights the importance of technology in agriculture and how it can help increase productivity and efficiency. The use of trains and robotic arms in the video emphasizes the importance of technology in modern agriculture. The video also highlights the importance of technology in agriculture and how it can help increase productivity and efficiency. Overall, the", "gt-answer": "C. robotic arms are working, then trains are driving", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the events occur in the following order: first, the serene landscape of a lush green field is showcased; then, the robotic arms working in a factory are shown; finally, the video transitions to the trains driving on the tracks.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases the harmonious coexistence of nature and technology. The serene landscape of a lush green field is juxtaposed with the mechanical precision of robotic arms working in a factory. The video then transitions to the trains driving on the tracks, showcasing the efficiency and speed of modern transportation. The video highlights the interconnectedness of nature and technology, emphasizing the importance of preserving the natural environment while advancing technological progress.", "gt-answer": "C. robotic arms are working, then trains are driving", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video showcases both trains driving through the landscape and robotic arms working in the background. It also mentions that the scene shifts to the robotic arms working in the same countryside setting, with trains driving by in the background. Based on this information, it can be inferred that trains driving occur before robotic arms are working.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases the harmonious coexistence of trains and robotic arms in a serene countryside setting. The video begins with trains driving through the picturesque landscape, while the robotic arms work in the background. The scene then shifts to the robotic arms working in the same countryside setting, with trains driving by in the background. The video highlights the beauty of nature and the efficiency of modern technology.", "gt-answer": "C. robotic arms are working, then trains are driving", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the trains gracefully glide through the landscape, and the robotic arms work in unison with the trains. This suggests that the trains are driving first, followed by the robotic arms working.", "chatgpt-answer": "A. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases the harmonious coexistence of nature and technology. The serene green fields and the lush vegetation provide a picturesque backdrop for the trains that gracefully glide through the landscape. The robotic arms work in unison with the trains, showcasing the efficiency and precision of modern technology. The video highlights the importance of preserving nature while embracing the advancements of technology.", "gt-answer": "C. robotic arms are working, then trains are driving", "rating": 0 } ] }, "1076877854_1073914229_2": { "order": [ { "chatgpt-reasoning": "The video description mentions that the robotic arms are seen working in a factory, while the trains are driving on the tracks. This implies that the events are happening simultaneously.", "chatgpt-answer": "C. they happen at the same time", "video-llm-prediction": "The video showcases the efficiency of robotic arms and trains working together in a harmonious manner. The robotic arms are seen working in a factory, while the trains are driving on the tracks. The video emphasizes the importance of teamwork and collaboration between humans and machines. The video also highlights the potential of technology to improve productivity and efficiency in various industries. The video is a testament to the power of technology and its ability to revolutionize the way we work.", "gt-answer": "B. trains are driving, then robotic arms are working", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video begins with trains driving along the tracks, followed by robotic arms working in the same field. Then it transitions to show the robotic arms working in the same field as the trains drive by. This indicates that the trains are driving first, followed by the robotic arms working.", "chatgpt-answer": "B. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases the harmonious collaboration between trains and robotic arms in a green field. The video begins with trains driving along the tracks, followed by robotic arms working in the same field. The video then transitions to show the robotic arms working in the same field as the trains drive by. The video highlights the efficiency and coordination between the two modes of transportation.", "gt-answer": "B. trains are driving, then robotic arms are working", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the video showcases a train passing by a field of green plants, followed by a close-up of the plants. Then, it shifts to a factory where robotic arms are working on the plants, and trains are driving by. This indicates that the trains driving come after the close-up of the plants and the robotic arms working.", "chatgpt-answer": "B. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases a train passing by a field of green plants, followed by a close-up of the plants. The scene then shifts to a factory where robotic arms are working on the plants, and trains are driving by. The video highlights the beauty of nature and the advancements in technology.", "gt-answer": "B. trains are driving, then robotic arms are working", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the train passing by the field of green plants is followed by a scene of robotic arms working in a factory. Then, the video transitions back to the field of green plants with the train passing by again. This indicates that the events occur in the order of trains driving first, then robotic arms working.", "chatgpt-answer": "B. trains are driving, then robotic arms are working", "video-llm-prediction": "The video showcases a train passing by a field of green plants, followed by a scene of robotic arms working in a factory. The video then transitions to a scene of the same field of green plants, with the train passing by again. The video highlights the beauty of nature and the advancements in technology.", "gt-answer": "B. trains are driving, then robotic arms are working", "rating": 1 } ] }, "1067268406_1067427023_0": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the white car is driving on the highway while the snow particles are melting simultaneously. This implies that both events are happening at the same time.", "chatgpt-answer": "B. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "The video shows a white car driving on a highway while snow particles are melting simultaneously. The car is seen driving on the highway while the snow particles are melting. The video captures the serene beauty of the highway with the snow melting in the background. The video showcases the contrast between the car's movement and the melting snow particles, creating a visually appealing scene. The video is a perfect representation of the beauty of nature and the peacefulness of driving on a highway.", "gt-answer": "B. a white car is driving while snow particles are melting simultaneously", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the white car is seen driving on the highway while snow particles are melting simultaneously. This suggests that both events are happening at the same time.", "chatgpt-answer": "B. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "The video showcases a white car driving down a highway while snow particles are melting simultaneously. The car is seen driving on the highway, and the snow particles are melting, creating a serene and picturesque scene. The video captures the beauty of nature and the tranquility of the highway, making it a perfect watch for anyone seeking a moment of peace and relaxation.", "gt-answer": "B. a white car is driving while snow particles are melting simultaneously", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that both the white car is driving and the snow particles are melting simultaneously.", "chatgpt-answer": "B. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A white car is driving on a highway while snow particles are melting simultaneously.", "gt-answer": "B. a white car is driving while snow particles are melting simultaneously", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the white car is driving down a highway while snow particles are melting. Since there is no specific mention of the order in which these events occur, it can be assumed that they are happening simultaneously.", "chatgpt-answer": "B. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "The video shows a white car driving down a highway while snow particles are melting. The car is seen driving on a bridge and on a highway with grass on the side. The video also shows a car driving on a highway with grass on the side, and a car driving on a highway with grass on the side.", "gt-answer": "B. a white car is driving while snow particles are melting simultaneously", "rating": 1 } ] }, "1067268406_1067427023_1": { "order": [ { "chatgpt-reasoning": "Based on the video description, the order of events in the video is that a white car is driving down a highway, passing by wind turbines. The camera then pans to show the wind turbines in the background. This sequence repeats multiple times, indicating that the car continues driving down the highway and passing by more wind turbines.", "chatgpt-answer": "C. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "The video starts with a white car driving down a highway, passing by wind turbines. The camera then pans to show the wind turbines in the background. The car continues driving down the highway, passing by more wind turbines. The camera then pans to show the wind turbines in the background. The car continues driving down the highway, passing by more wind turbines. The camera then pans to show the wind turbines in the background. The car continues driving down the highway, passing by more wind turbines. The camera then pans to show the wind turbines in", "gt-answer": "A. a white car is driving, then snow particles are melting", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white car is driving down a highway, passing by wind turbines, and then stopping to allow the snow particles to melt. This indicates that first, the white car is driving, then the snow particles are melting.", "chatgpt-answer": "A. a white car is driving, then snow particles are melting", "video-llm-prediction": "The video showcases a white car driving down a highway, passing by wind turbines, and then stopping to allow the snow particles to melt.", "gt-answer": "A. a white car is driving, then snow particles are melting", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that a white car is seen driving down a highway while snow particles are melting simultaneously. This indicates that both events are happening at the same time.", "chatgpt-answer": "C. A white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A white car is seen driving down a highway while snow particles are melting simultaneously. The video captures the serene beauty of the snowy landscape as the car moves forward. The sound of the engine and the crunching of the snow under the tires can be heard, adding to the immersive experience. The video ends with the car disappearing into the distance, leaving behind a trail of snow particles.", "gt-answer": "A. a white car is driving, then snow particles are melting", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white car is driving down a highway while snow particles are melting simultaneously. This means that both events are happening at the same time, so option C is the correct answer.", "chatgpt-answer": "C. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A white car is driving down a highway while snow particles are melting simultaneously. The video showcases the serene beauty of nature and the peacefulness of driving on a highway.", "gt-answer": "A. a white car is driving, then snow particles are melting", "rating": 0 } ] }, "1067268406_1067427023_2": { "order": [ { "chatgpt-reasoning": "The video description mentions that the order of events is \"a white car is driving while snow particles are melting simultaneously\".", "chatgpt-answer": "A. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "The video shows a white car driving down a highway while snow particles are melting simultaneously. The car is seen driving on a bridge and a highway, and the video captures the serene beauty of the snowy landscape. The video also shows the car driving on a bridge and a highway, and the snowy landscape is breathtaking. The video is a perfect representation of the beauty of nature and the joy of driving on a beautiful day.", "gt-answer": "B. snow particles are melting, then a white car is driving", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, it is mentioned that the video showcases a white car driving down a highway while snow particles are melting simultaneously. This indicates that the car's movement is happening alongside the melting of the snow particles.", "chatgpt-answer": "A. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "The video showcases a white car driving down a highway while snow particles are melting simultaneously. The car's movement is captured from different angles, and the camera captures the car's speed and movement. The video also highlights the beauty of the snowy landscape and the serene atmosphere of the highway. The video's focus is on the car's journey and the surrounding environment, creating a sense of tranquility and freedom.", "gt-answer": "B. snow particles are melting, then a white car is driving", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the white car is driving on a highway while snow particles are melting simultaneously. This indicates that both events are happening at the same time.", "chatgpt-answer": "A. a white car is driving while snow particles are melting simultaneously", "video-llm-prediction": "A white car is driving on a highway while snow particles are melting simultaneously.", "gt-answer": "B. snow particles are melting, then a white car is driving", "rating": 0 }, { "chatgpt-reasoning": "The video description states that \"A white car is driving on a highway while snow particles are melting simultaneously\", indicating that the car is driving first and then the snow particles are melting.", "chatgpt-answer": "C. a white car is driving, then snow particles are melting", "video-llm-prediction": "A white car is driving on a highway while snow particles are melting simultaneously. The video captures the serene beauty of the snowy landscape and the peacefulness of the drive.", "gt-answer": "B. snow particles are melting, then a white car is driving", "rating": 0 } ] }, "1086286649": { "action": [ { "chatgpt-reasoning": "The video description mentions that the armored vehicles are parked in the middle of the road and are firing at each other. This indicates that the correct answer should be D. Firing, as they are engaged in a firefight.", "chatgpt-answer": "D. Firing", "video-llm-prediction": "The video shows a group of armored vehicles driving down a snowy road. The vehicles are parked in the middle of the road, and they are firing at each other. The video also shows a man standing in the middle of the road.", "gt-answer": "C. Driving", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the armored vehicles are seen parked, driving down the road, and firing at each other.", "chatgpt-answer": "D. Firing", "video-llm-prediction": "The video shows a group of armored vehicles driving down a snowy road. The vehicles are seen parked and driving down the road, and they are also shown firing at each other. The video captures the movement and actions of the vehicles in the snowy environment.", "gt-answer": "C. Driving", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the armored vehicles are driving down a snowy road and one of them is firing a weapon. It also states that the vehicles are parked in the snow. Therefore, the correct answer is D. Firing.", "chatgpt-answer": "D. Firing", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road, with one of them firing a weapon. The video also shows the vehicles parked in the snow.", "gt-answer": "C. Driving", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that one of the armored vehicles is firing a weapon. Additionally, it states that the vehicles are parked in the snow and there is a person loading people into one of them.", "chatgpt-answer": "D. Firing", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road, with one of them firing a weapon. The vehicles are parked in the snow, and a person is seen loading people into one of them.", "gt-answer": "C. Driving", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "In the video description, it is mentioned that the first vehicle is driving towards the camera while the second vehicle is driving away from the camera. This means that the armored vehicles are moving from left to right from the camera's point of view.", "chatgpt-answer": "C. Left to right", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road. The first vehicle is driving towards the camera while the second vehicle is driving away from the camera. The vehicles are moving in opposite directions, and the snowy road is covered with snow. The video captures the serene beauty of the snowy landscape and the vehicles' movement.", "gt-answer": "B. Right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that one of the vehicles is driving in the opposite direction. Since it does not specify which direction the camera is facing, we can assume that the camera is stationary and the armored vehicles are moving relative to the camera's point of view.", "chatgpt-answer": "A. Stationary", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road, with one of them driving in the opposite direction. The vehicles are surrounded by snow and trees, and the road is covered in snow. The video captures the serene beauty of winter, with the snow-covered landscape and the vehicles driving through it. The sound of the vehicles' engines and the crunching of the snow under their wheels can be heard, adding to the immersive experience. The video is a perfect representation of the winter season, with its snowy landscape and the vehicles driving through it.", "gt-answer": "B. Right to left", "rating": 0 }, { "chatgpt-reasoning": "The video description states that one vehicle is driving towards the camera while the other is driving away from it. The term \"towards\" indicates movement in the direction of the camera, and \"away\" indicates movement in the opposite direction. Therefore, the armored vehicle driving towards the camera is moving left to right, while the one driving away from the camera is moving right to left.", "chatgpt-answer": "C. Left to right", "video-llm-prediction": "Two armored vehicles are driving down a snowy road. One vehicle is driving towards the camera while the other is driving away from it. The vehicles are moving in opposite directions.", "gt-answer": "B. Right to left", "rating": 0 }, { "chatgpt-reasoning": "In the video description, it is mentioned that the armored vehicles are stationary. Therefore, they are not moving from the camera's point of view.", "chatgpt-answer": "A. Stationary", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road. The vehicles are stationary, and the camera captures them from behind. The video does not provide any additional information.", "gt-answer": "B. Right to left", "rating": 0 } ], "speed": [ { "chatgpt-reasoning": "The video description states that the first vehicle is driving slowly, while the second vehicle is driving rapidly. Therefore, both armored vehicles are moving, but at different speeds - the first vehicle is moving slowly and the second vehicle is moving rapidly.", "chatgpt-answer": "C. Slowly", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road. The first vehicle is driving slowly, while the second vehicle is driving rapidly. The video does not provide any information about the speed of the first vehicle.", "gt-answer": "C. Slowly", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically states that one of the armored vehicles is driving slowly.", "chatgpt-answer": "C. Slowly", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road, with one of them driving slowly. The video also shows a man standing in the snow, and a person walking in the snow.", "gt-answer": "C. Slowly", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that one armored vehicle is moving slowly and the other is moving rapidly.", "chatgpt-answer": "C. Slowly", "video-llm-prediction": "Two armored vehicles are driving down a snowy road, one moving slowly and the other rapidly.", "gt-answer": "C. Slowly", "rating": 1 }, { "chatgpt-reasoning": "The video description states that one of the armored vehicles is driving slowly down the snowy road.", "chatgpt-answer": "C. Slowly", "video-llm-prediction": "The video shows two armored vehicles driving down a snowy road, with one of them driving slowly. The vehicles are surrounded by snowy landscapes, and the video captures the serene beauty of winter.", "gt-answer": "C. Slowly", "rating": 1 } ] }, "1093041749": { "action": [ { "chatgpt-reasoning": "The video description mentions that the dragon is seen flying, swimming, and breathing fire.", "chatgpt-answer": "A. flying, B. swimming, and C. breathing fire", "video-llm-prediction": "The video features a dragon that is seen flying, swimming, and breathing fire. The dragon is shown in various positions, including standing on a beach and in the water. The video also shows the dragon in a fiery inferno, adding to the overall dramatic effect.", "gt-answer": "C. breathing fire", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the dragon is seen flying over a city, then swimming in the water, and finally breathing fire. This indicates that the dragon is performing multiple actions, including flying, swimming, and breathing fire.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A dragon is seen flying over a city, then swimming in the water, and finally breathing fire.", "gt-answer": "C. breathing fire", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the dragon is seen flying in the sky, swimming in the water, and breathing fire. This means that the dragon is doing all three actions mentioned.", "chatgpt-answer": "A. flying, B. swimming, C. breathing fire", "video-llm-prediction": "A dragon is seen flying in the sky, swimming in the water, and breathing fire.", "gt-answer": "C. breathing fire", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the dragon is seen flying in the sky, swimming in the water, and breathing fire. Therefore, the correct answer is all of the above (A. flying, B. swimming, C. breathing fire).", "chatgpt-answer": "A. flying, B. swimming, C. breathing fire", "video-llm-prediction": "A dragon is seen flying in the sky, swimming in the water, and breathing fire.", "gt-answer": "C. breathing fire", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description clearly states that the dragon first flies to the sky and then breathes fire. After that, it lands from the sky and breathes fire again. Therefore, the correct answer is option A.", "chatgpt-answer": "A. flying to the sky and then breathing fire", "video-llm-prediction": "The video shows a dragon flying to the sky and then breathing fire. The dragon then lands from the sky and breathes fire again.", "gt-answer": "B. landing from the sky and then breathing fire", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dragon first flies to the sky and then breathes fire. After that, it lands and continues to breathe fire.", "chatgpt-answer": "A. flying to the sky and then breathing fire", "video-llm-prediction": "A dragon is seen flying to the sky and then breathing fire. It then lands and continues to breathe fire.", "gt-answer": "B. landing from the sky and then breathing fire", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the dragon is first seen flying to the sky and then breathing fire.", "chatgpt-answer": "A. flying to the sky and then breathing fire", "video-llm-prediction": "A dragon is seen flying to the sky and then breathing fire.", "gt-answer": "B. landing from the sky and then breathing fire", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the dragon flies to the sky first and then breathes fire. After that, it lands back on the ground and continues to breathe fire. Therefore, the correct order of events performed by the dragon is \"flying to the sky and then breathing fire\".", "chatgpt-answer": "A. flying to the sky and then breathing fire", "video-llm-prediction": "The video features a dragon that flies to the sky and then breathes fire. The dragon then lands back on the ground and continues to breathe fire.", "gt-answer": "B. landing from the sky and then breathing fire", "rating": 0 } ] }, "1076180768": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the knight is performing multiple actions - riding a horse, wielding a spear, drawing a sword from a sheath, and shooting an arrow.", "chatgpt-answer": "A. riding a horse, B. wielding a spear, C. drawing sword from sheath, D. shooting an arrow", "video-llm-prediction": "A knight is seen riding a horse, wielding a spear, drawing a sword from a sheath, and shooting an arrow.", "gt-answer": "C. drawing sword from sheath", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the knight is seen riding a horse, wielding a spear, drawing a sword from his sheath, and shooting an arrow.", "chatgpt-answer": "A. riding a horse, B. wielding a spear, C. drawing sword from sheath, D. shooting an arrow", "video-llm-prediction": "A knight is seen riding a horse, wielding a spear, and drawing a sword from his sheath. The video also shows the knight shooting an arrow.", "gt-answer": "C. drawing sword from sheath", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the knight is seen \"riding a horse, wielding a spear, drawing a sword from his sheath, and shooting an arrow.\" This means that the knight is engaging in all of these actions.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "A knight is seen riding a horse, wielding a spear, drawing a sword from his sheath, and shooting an arrow.", "gt-answer": "C. drawing sword from sheath", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the knight is seen riding a horse, wielding a spear, drawing a sword from his sheath, and shooting an arrow. This indicates that the knight is doing multiple actions in the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A knight is seen riding a horse, wielding a spear, and drawing a sword from his sheath. The video also shows the knight shooting an arrow.", "gt-answer": "C. drawing sword from sheath", "rating": 0 } ] }, "3406661033": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is in a wheelchair and propelling himself forward. There is no mention of swimming or walking.", "chatgpt-answer": "A. propelling himself forward in wheelchair", "video-llm-prediction": "A man in a wheelchair is seen propelling himself forward in a spacious room. He is wearing a grey shirt and black pants, and he is moving at a steady pace. The room is well-lit, with a large window in the background. The man is accompanied by a woman who is sitting at a table, working on a laptop. The woman is wearing a white shirt and black pants, and she is focused on her work. The man continues to move forward, passing by the woman and the table. The video captures the man's determination and resilience as", "gt-answer": "A. propelling himself forward in wheelchair", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is first seen moving forward in a wheelchair, then swimming, and finally walking.", "chatgpt-answer": "C. walking", "video-llm-prediction": "A man in a wheelchair is seen moving forward, while a woman is seen reading a document. The man then proceeds to swim, and later, he is seen walking.", "gt-answer": "A. propelling himself forward in wheelchair", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the man is in a wheelchair and is propelling himself forward.", "chatgpt-answer": "A. propelling himself forward in wheelchair", "video-llm-prediction": "A man in a wheelchair is seen propelling himself forward, while a woman is seen swimming and another man is seen walking.", "gt-answer": "A. propelling himself forward in wheelchair", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a man in a wheelchair is seen moving forward, while another man is swimming and the third man is walking. This indicates that the man in the wheelchair is propelling himself forward.", "chatgpt-answer": "A. propelling himself forward in wheelchair", "video-llm-prediction": "A man in a wheelchair is seen moving forward, while another man is swimming. The third man is walking.", "gt-answer": "A. propelling himself forward in wheelchair", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description clearly states that the man in the wheelchair first hands the document to his colleagues and then stands up from the wheelchair. There is no mention of him propelling himself forward in the wheelchair.", "chatgpt-answer": "A. The man hands the document to colleagues and then stands up from the wheelchair", "video-llm-prediction": "The video shows a man in a wheelchair who hands a document to his colleagues. He then stands up from the wheelchair and hands the document to his colleagues.", "gt-answer": "B. The man propels himself forward in wheelchair and then hands the document to colleagues.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man first hands the document to his colleagues and then stands up from the wheelchair.", "chatgpt-answer": "A. The man hands the document to colleagues and then stands up from the wheelchair", "video-llm-prediction": "The video shows a man in a wheelchair who hands a document to his colleagues. He then stands up from the wheelchair and hands the document to his colleagues. The video captures the man's actions of standing up and handing the document to his colleagues.", "gt-answer": "B. The man propels himself forward in wheelchair and then hands the document to colleagues.", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man in the wheelchair hands a document to his colleagues, then stands up and hands it to them again. This implies that the order of events is first handing the document to colleagues, then standing up from the wheelchair.", "chatgpt-answer": "A. The man hands the document to colleagues and then stands up from the wheelchair.", "video-llm-prediction": "A man in a wheelchair hands a document to his colleagues, then stands up and hands it to them again.", "gt-answer": "B. The man propels himself forward in wheelchair and then hands the document to colleagues.", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man first hands the document to his colleagues and then stands up from the wheelchair.", "chatgpt-answer": "A. The man hands the document to colleagues and then stands up from the wheelchair", "video-llm-prediction": "A man in a wheelchair hands a document to his colleagues and then stands up from the wheelchair.", "gt-answer": "B. The man propels himself forward in wheelchair and then hands the document to colleagues.", "rating": 0 } ] }, "3406618583": { "action": [ { "chatgpt-reasoning": "The video description explicitly mentions that the woman starts with a hip-hop dance, then switches to a salsa dance, moves on to a ballet dance, and finally ends with a freestyle dance. Therefore, all of these dance styles are mentioned in the description.", "chatgpt-answer": "A. hip-hop, B. salsa, C. ballet, D. freestyle dance", "video-llm-prediction": "A woman is seen dancing in a room with a window. She starts by doing a hip-hop dance and then switches to a salsa dance. She then moves on to a ballet dance and finally ends with a freestyle dance.", "gt-answer": "D. freestyle dance", "rating": 0 }, { "chatgpt-reasoning": "The video description does not provide specific details about the type of dance the woman is performing. It only mentions that her movements are fluid and graceful, and she appears to be enjoying herself while dancing around the room. Without any clear indication or mention of a specific dance style, it is impossible to determine the exact type of dance.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a woman who is seen dancing in a room. She starts by moving her arms and legs around, and then proceeds to dance around the room. The woman's movements are fluid and graceful, and she appears to be enjoying herself. The room is well-lit, and there are a few pieces of furniture visible in the background. The woman's outfit is casual, and she seems to be wearing comfortable clothes. Overall, the video captures a moment of joy and freedom as the woman dances around the room.", "gt-answer": "D. freestyle dance", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is performing hip-hop, salsa, ballet, and freestyle dance moves.", "chatgpt-answer": "A. hip-hop, B. salsa, C. ballet, D. freestyle dance", "video-llm-prediction": "A woman in a blue dress dances in a room with a window. She performs hip-hop, salsa, ballet, and freestyle dance moves.", "gt-answer": "D. freestyle dance", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is performing a freestyle dance.", "chatgpt-answer": "D. freestyle dance", "video-llm-prediction": "A woman in a blue dress performs a freestyle dance in a room with a window.", "gt-answer": "D. freestyle dance", "rating": 1 } ], "direction": [ { "chatgpt-reasoning": "From the video description, there is no mention of any camera movement or change in perspective. The description focuses on the actions and positions of the woman, rather than the camera movement.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video features a woman who is seen dancing in a room. She is wearing a blue dress and is seen dancing in front of a mirror. The woman is also seen standing in front of a window and holding a cell phone. The video is shot in a room with a window and a mirror. The woman is seen dancing in different positions, including standing and sitting. The video ends with the woman standing in front of the mirror.", "gt-answer": "B. panning up and down around the girl", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera showcases the woman's dance routine and ends with her walking away from the camera. There are no specific details provided about the camera movement, such as panning, rotating, or zooming. Therefore, it is not possible to determine the direction of the camera movement based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a woman performing a dance routine in a room. She starts by standing in front of a mirror and then proceeds to dance around the room. The woman's movements are fluid and graceful, and she appears to be enjoying herself. The room is well-lit, and the woman's outfit is casual and comfortable. The video ends with the woman finishing her dance and walking away from the camera. Overall, the video is a beautiful display of the woman's talent and passion for dance.", "gt-answer": "B. panning up and down around the girl", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is seen dancing and moving her arms around while the camera continues to dance around the room. From this information, we can infer that the camera movement is not focused on a specific point but is moving in sync with the woman's movements.", "chatgpt-answer": "A. panning left and right around the girl", "video-llm-prediction": "A woman in a room is seen dancing and moving her arms around. She continues to dance around the room while looking off into the distance.", "gt-answer": "B. panning up and down around the girl", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions various actions of the woman, but does not provide any information about the camera movement. Therefore, we cannot determine the direction of the camera movement based on the given description.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A woman is seen dancing in a room with a window. She is wearing a blue dress and has her hair in a bun. She starts by dancing with her hands up and then moves her hands down. She continues to dance and ends by waving.", "gt-answer": "B. panning up and down around the girl", "rating": 0 } ] }, "3405120819": { "action": [ { "chatgpt-reasoning": "The video description mentions that the chef is cutting dough, shaping it, and then placing it in a dish. All of the choices are correct based on the description.", "chatgpt-answer": "A. cutting dough, B. shaping dough, C. placing dough in a dish", "video-llm-prediction": "A chef is shown in a kitchen, cutting dough and shaping it. He then places the dough in a dish.", "gt-answer": "B. shaping dough", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the chef is cutting dough, shaping it, and placing it in a dish.", "chatgpt-answer": "A. cutting dough, B. shaping dough, C. placing dough in a dish", "video-llm-prediction": "A chef is seen in a kitchen, cutting dough and shaping it. He then places the dough in a dish and smiles.", "gt-answer": "B. shaping dough", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the chef is cutting dough, shaping it, and placing it in a dish.", "chatgpt-answer": "A. cutting dough, B. shaping dough, C. placing dough in a dish", "video-llm-prediction": "A chef is seen cutting dough, shaping it, and placing it in a dish.", "gt-answer": "B. shaping dough", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the chef is cutting dough, shaping it, and placing it in a dish.", "chatgpt-answer": "A. cutting dough, B. shaping dough, C. placing dough in a dish", "video-llm-prediction": "A chef is seen cutting dough, shaping it, and placing it in a dish.", "gt-answer": "B. shaping dough", "rating": 0 } ], "order": [ { "chatgpt-reasoning": "The video description mentions that the chef is cutting dough and shaping it into a ball. The description also states that the chef smiles at the camera and continues shaping the dough. Therefore, the correct order of actions performed by the chef is cutting dough and then shaping dough.", "chatgpt-answer": "A. cutting dough and then shaping dough", "video-llm-prediction": "A chef is seen cutting dough and shaping it into a ball. He then smiles at the camera and continues shaping the dough. The video showcases the process of making dough and shaping it into a ball. The chef's actions are consistent with the video, and he is seen cutting and shaping dough throughout the video.", "gt-answer": "C. shaping dough and then smiling at the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the chef is cutting and shaping dough, and then smiling at the camera. Therefore, the correct order of actions is cutting dough and then shaping dough.", "chatgpt-answer": "A. cutting dough and then shaping dough", "video-llm-prediction": "The video features a chef who is seen cutting and shaping dough, and then smiling at the camera. The chef is shown in a kitchen, and he is wearing a chef's uniform. The video seems to be a tutorial on how to make dough, and the chef is demonstrating the process step by step. The video is shot in a clear and concise manner, making it easy to follow along. Overall, the video is informative and helpful for anyone who wants to learn how to make dough.", "gt-answer": "C. shaping dough and then smiling at the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the chef first cuts the dough and then shapes it before smiling at the camera.", "chatgpt-answer": "A. cutting dough and then shaping dough", "video-llm-prediction": "A chef is seen cutting dough and shaping it before smiling at the camera.", "gt-answer": "C. shaping dough and then smiling at the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the chef is first shaping the dough and then cutting it. There is no mention of the chef smiling at the camera or any other actions.", "chatgpt-answer": "C. shaping dough and then smiling at the camera", "video-llm-prediction": "A chef is seen shaping dough and then cutting it. He then smiles at the camera.", "gt-answer": "C. shaping dough and then smiling at the camera", "rating": 1 } ] }, "3405088753": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman takes the bag of bread and leaves the bakery, indicating that she is buying bread.", "chatgpt-answer": "C. buying bread", "video-llm-prediction": "A man in a bakery is seen wrapping a bag of bread to a woman. The woman then takes the bag and leaves the bakery.", "gt-answer": "C. buying bread", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man in the bakery puts a bag of bread on the counter and then gives it to the woman who is standing behind the counter. Therefore, it can be inferred that the woman is buying bread.", "chatgpt-answer": "C. buying bread", "video-llm-prediction": "A man in a bakery is seen putting a bag of bread on a counter. He then proceeds to give the bag to a woman who is standing behind the counter. The man then walks away from the counter.", "gt-answer": "C. buying bread", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the woman proceeds to buy bread from the bakery.", "chatgpt-answer": "C. buying bread", "video-llm-prediction": "A man in a bakery is seen holding a basket of bread and talking to a woman. The woman then proceeds to buy bread from the bakery.", "gt-answer": "C. buying bread", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman takes the bag of bread and leaves the bakery. This implies that she is buying bread.", "chatgpt-answer": "C. buying bread", "video-llm-prediction": "A man in a bakery is seen wrapping a bag of bread to a woman. The woman then takes the bag and leaves the bakery.", "gt-answer": "C. buying bread", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description mentions that the salesman is seen in a bakery, packing up bread for a woman. It also states that he then says something to the woman and proceeds to pack up the bread for her. Therefore, the correct order of events would be for the salesman to first pack up the bread for the woman and then say something to her.", "chatgpt-answer": "B. packing up the bread for the woman and then saying something to the woman", "video-llm-prediction": "A salesman is seen in a bakery, packing up bread for a woman. He then says something to the woman and proceeds to pack up the bread for her. The video showcases the salesman's actions in the bakery.", "gt-answer": "B. packing up the bread for the woman and then saying something to the woman", "rating": 1 }, { "chatgpt-reasoning": "Based on the video description, the events involving the salesman occur in a specific order. The salesman is first seen packing up the bread for the woman, and then he is seen saying something to the woman.", "chatgpt-answer": "B. packing up the bread for the woman and then saying something to the woman", "video-llm-prediction": "A salesman is seen packing up bread for a woman while speaking to her. The salesman is wearing a brown apron and glasses. The woman is wearing a white shirt and a black apron. The salesman is seen speaking to the woman while packing up the bread. The salesman is also seen speaking to the woman while packing up the bread. The salesman is seen packing up the bread for the woman and then speaking to her. The salesman is seen packing up the bread for the woman and then saying something to the woman.", "gt-answer": "B. packing up the bread for the woman and then saying something to the woman", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the salesman is seen packing up bread for a woman while saying something to her. This indicates that the action of packing up the bread occurs simultaneously with the action of saying something to the woman.", "chatgpt-answer": "A. They happen at the same time", "video-llm-prediction": "A salesman is seen packing up bread for a woman while saying something to her.", "gt-answer": "B. packing up the bread for the woman and then saying something to the woman", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the salesman is packing up bread for a woman while speaking to her. This implies that the events of packing up the bread and saying something to the woman are happening simultaneously.", "chatgpt-answer": "A. They happen at the same time", "video-llm-prediction": "A salesman is seen packing up bread for a woman while speaking to her.", "gt-answer": "B. packing up the bread for the woman and then saying something to the woman", "rating": 0 } ] }, "3401191309": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that the man is putting on a prosthetic running blade, taking it off, and repairing it. Therefore, all three activities are performed by the man in the video.", "chatgpt-answer": "A. putting on prosthetic running blade", "video-llm-prediction": "A man is seen putting on a prosthetic running blade and taking it off. He is also seen repairing a prosthetic running blade.", "gt-answer": "B. taking off prosthetic running blade", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen putting on a prosthetic running blade and taking it off. It also mentions that he is repairing a prosthetic running blade. This implies that the athletic man is engaged in all three activities in the video.", "chatgpt-answer": "A. putting on prosthetic running blade", "video-llm-prediction": "The video shows a man putting on a prosthetic running blade and taking it off. The man is also seen repairing a prosthetic running blade.", "gt-answer": "B. taking off prosthetic running blade", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen putting on a prosthetic running blade, taking it off, and repairing it.", "chatgpt-answer": "A. putting on prosthetic running blade", "video-llm-prediction": "A man wearing a black shirt and black pants is seen putting on a prosthetic running blade. He then takes it off and repairs it.", "gt-answer": "B. taking off prosthetic running blade", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen putting on a prosthetic running blade, then taking it off and repairing it. Therefore, the correct answer is option B: taking off prosthetic running blade.", "chatgpt-answer": "B. taking off prosthetic running blade", "video-llm-prediction": "A man is seen putting on a prosthetic running blade while kneeling on a blue mat. He then takes off the prosthetic running blade and repairs it.", "gt-answer": "B. taking off prosthetic running blade", "rating": 1 } ] }, "21218935": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the woman is exercising. She is doing sit-ups, which is a form of physical exercise. Additionally, the video mentions that she is smiling at the camera, which suggests that she is enjoying the activity.", "chatgpt-answer": "A. exercising", "video-llm-prediction": "A woman is seen exercising in a video. She is seen doing sit-ups and smiling at the camera.", "gt-answer": "A. exercising", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is exercising.", "chatgpt-answer": "A. exercising", "video-llm-prediction": "A woman is seen exercising in a video.", "gt-answer": "A. exercising", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is exercising.", "chatgpt-answer": "A. exercising", "video-llm-prediction": "A woman is seen exercising in a video.", "gt-answer": "A. exercising", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is exercising.", "chatgpt-answer": "A. exercising", "video-llm-prediction": "A woman is seen exercising in a video.", "gt-answer": "A. exercising", "rating": 1 } ], "order": [ { "chatgpt-reasoning": "The video description mentions that the woman is seen doing push ups and smiling at the camera. Then, she frowns at the camera and continues doing push ups. Therefore, the correct order of events for the woman is doing push ups and then frowning at the camera.", "chatgpt-answer": "B. doing push ups and then frowning at the camera", "video-llm-prediction": "A woman is seen doing push ups and smiling at the camera. She then frowns at the camera and continues doing push ups.", "gt-answer": "A. doing push ups and then smiling at the camera", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is first doing push ups and then smiling at the camera. It does not mention any other actions or emotions in the given order.", "chatgpt-answer": "A. doing push ups and then smiling at the camera", "video-llm-prediction": "The video features a woman who is seen doing push ups and then smiling at the camera. She continues to do more push ups while smiling at the camera.", "gt-answer": "A. doing push ups and then smiling at the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is \"doing push ups and smiling at the camera\". This indicates that she is performing the action of doing push ups first, and then smiling at the camera.", "chatgpt-answer": "A. doing push ups and then smiling at the camera", "video-llm-prediction": "A woman is seen doing push ups and smiling at the camera.", "gt-answer": "A. doing push ups and then smiling at the camera", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is doing push ups and smiling at the camera. This implies that she performs the push ups first and then smiles at the camera.", "chatgpt-answer": "A. doing push ups and then smiling at the camera", "video-llm-prediction": "A woman is seen doing push ups and smiling at the camera.", "gt-answer": "A. doing push ups and then smiling at the camera", "rating": 1 } ] }, "5395244": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the woman is seen walking across a pebble creek and then proceeds to canoe across the same creek.", "chatgpt-answer": "D. walking across the pebble creek", "video-llm-prediction": "A woman is seen walking across a pebble creek. She then proceeds to canoe across the same creek.", "gt-answer": "D. walking across the pebble creek", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is walking across the pebble creek, as well as carrying a stick in her hand. It also describes her taking her time and appearing happy, indicating a leisurely activity like walking rather than a more active one like canoeing, swimming, or running.", "chatgpt-answer": "D. walking across the pebble creek", "video-llm-prediction": "A woman is seen walking across a pebble creek, and she is wearing a blue dress. She is also carrying a stick in her hand. The woman continues to walk across the creek, and she looks very happy. The water in the creek is clear, and you can see the rocks underneath. The woman seems to be enjoying her time in the creek, and she is taking her time to walk across it. The surrounding area is also very beautiful, with lush green trees and a blue sky in the background. Overall, the video captures a serene and peaceful moment of", "gt-answer": "D. walking across the pebble creek", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is canoeing across the pebble creek. She is seen paddling her way through the water while wearing a blue dress.", "chatgpt-answer": "A. canoeing across the pebble creek", "video-llm-prediction": "A woman is seen canoeing across a pebble creek. She is wearing a blue dress and is seen paddling her way through the water. The creek is surrounded by trees and rocks, and the water is crystal clear. The woman seems to be enjoying her time as she paddles her way through the water.", "gt-answer": "D. walking across the pebble creek", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is first seen walking across the pebble creek while holding a stick, then she proceeds to run across the creek. Finally, she canoes across it. Therefore, the correct answer is D. walking across the pebble creek.", "chatgpt-answer": "D. walking across the pebble creek", "video-llm-prediction": "A woman is seen walking across a pebble creek while holding a stick. She then proceeds to run across the creek and finally canoes across it.", "gt-answer": "D. walking across the pebble creek", "rating": 1 } ] }, "1037628617": { "action": [ { "chatgpt-reasoning": "The video description specifically mentions that the person is performing multiple actions, including pressing a keyboard key and rotating a jog dial, clicking a button and rolling a wheel on a mouse, and tapping a touchpad and scrolling with two fingers.", "chatgpt-answer": "A. Pressing a keyboard key and rotating a jog dial", "video-llm-prediction": "A person is seen pressing a keyboard key and rotating a jog dial. The person then clicks a button and rolls a wheel on a mouse. Finally, the person taps a touchpad and scrolls with two fingers.", "gt-answer": "B. clicking button and rolling wheel on a mouse", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the person is pressing a keyboard key and rotating a jog dial, while also clicking a button and rolling a wheel on a mouse. None of the other choices are mentioned in the description.", "chatgpt-answer": "A. Pressing a keyboard key and rotating a jog dial", "video-llm-prediction": "The video showcases a person demonstrating the use of a computer mouse and keyboard. The person is seen pressing a keyboard key and rotating a jog dial, while also clicking a button and rolling a wheel on a mouse. The video provides a clear visual representation of these actions, making it easy for viewers to understand how to use the computer peripherals.", "gt-answer": "B. clicking button and rolling wheel on a mouse", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the person is pressing a keyboard key and rotating a jog dial. None of the other answer choices mention these specific actions.", "chatgpt-answer": "A. Pressing a keyboard key and rotating a jog dial", "video-llm-prediction": "A person is seen pressing a keyboard key and rotating a jog dial.", "gt-answer": "B. clicking button and rolling wheel on a mouse", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the person is pressing a keyboard key and rotating a jog dial, clicking a button and rolling a wheel on a mouse, and tapping a touchpad and scrolling with two fingers.", "chatgpt-answer": "A. Pressing a keyboard key and rotating a jog dial.", "video-llm-prediction": "A person is seen pressing a keyboard key and rotating a jog dial. The person then clicks a button and rolls a wheel on a mouse. Finally, the person taps a touchpad and scrolls with two fingers.", "gt-answer": "B. clicking button and rolling wheel on a mouse", "rating": 0 } ] }, "1066801717": { "action": [ { "chatgpt-reasoning": "Based on the video description, the woman is seen holding a vase with yellow flowers, cutting the stems of the flowers, and arranging them in the vase. She also waters the flowers. Therefore, the correct answer is B. arranging bouquet of daffodils.", "chatgpt-answer": "B. arranging bouquet of daffodils", "video-llm-prediction": "A woman is seen holding a vase with yellow flowers in her hands. She then proceeds to cut the stems of the flowers and places them in the vase. After that, she waters the flowers and arranges them in the vase. The video captures the process of the woman creating a beautiful bouquet of daffodils.", "gt-answer": "B. arranging bouquet of daffodils", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is holding a vase filled with yellow flowers, cutting the stems of the flowers, and arranging them in the vase. This indicates that she is working with the bouquet of daffodils, so the correct answer would be C. cutting bouquet of daffodils.", "chatgpt-answer": "C. cutting bouquet of daffodils", "video-llm-prediction": "A woman is seen holding a vase filled with yellow flowers and talking to the camera. She then proceeds to cut the stems of the flowers and places them in the vase. The woman then proceeds to water the flowers and arranges them in the vase.", "gt-answer": "B. arranging bouquet of daffodils", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is holding a vase filled with yellow flowers and watering it. Then, she proceeds to arrange the flowers in the vase and cuts them. From this information, we can infer that the woman is arranging bouquet of daffodils.", "chatgpt-answer": "B. arranging bouquet of daffodils", "video-llm-prediction": "A woman is seen holding a vase filled with yellow flowers and watering it. She then proceeds to arrange the flowers in the vase and cuts them.", "gt-answer": "B. arranging bouquet of daffodils", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the woman is holding a vase filled with yellow flowers, watering them, and then proceeding to arrange and cut the flowers in the vase. This indicates that she is arranging bouquet of daffodils.", "chatgpt-answer": "B. arranging bouquet of daffodils", "video-llm-prediction": "A woman is seen holding a vase filled with yellow flowers and watering them. She then proceeds to arrange the flowers in the vase and cuts them to make them look even more beautiful.", "gt-answer": "B. arranging bouquet of daffodils", "rating": 1 } ] }, "1088428381": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the woman is holding a gift box, wrapping it with a bow, and then opening it. This indicates that she is in the process of preparing or giving a gift.", "chatgpt-answer": "C. wrapping a gift box", "video-llm-prediction": "A woman is seen holding a gift box and wrapping it with a bow. She then opens the box and smiles.", "gt-answer": "B. opening a gift box", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the woman is holding a gift box, wrapping it with a bow, and then opening the box and smiling. Therefore, the correct answer would be \"C. wrapping a gift box\", as it accurately describes the actions performed by the woman in the video.", "chatgpt-answer": "C. wrapping a gift box", "video-llm-prediction": "A woman is seen holding a gift box and wrapping it with a bow. She then opens the box and smiles.", "gt-answer": "B. opening a gift box", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is seen holding a gift box and wrapping it with a bow. This indicates that she is in the process of wrapping a gift box.", "chatgpt-answer": "C. wrapping a gift box", "video-llm-prediction": "A woman is seen holding a gift box and wrapping it with a bow. She then presents the wrapped box to the camera.", "gt-answer": "B. opening a gift box", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is holding a gift box and wrapping it with a bow. This indicates that she is in the process of wrapping a gift box.", "chatgpt-answer": "C. wrapping a gift box", "video-llm-prediction": "A woman is seen holding a gift box and wrapping it with a bow. She then presents the wrapped box to the camera.", "gt-answer": "B. opening a gift box", "rating": 0 } ] }, "1069593640": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman is seen drying her hair with a towel, washing her face with the same towel, and wrapping the towel around her neck.", "chatgpt-answer": "C. putting a towel on her neck", "video-llm-prediction": "A woman is seen drying her hair with a towel. She then proceeds to wash her face with the same towel. After that, she wraps the towel around her neck.", "gt-answer": "C. putting a towel on her neck", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the woman is seen drying her hair with a towel, washing her face with a towel, and putting a towel on her neck.", "chatgpt-answer": "A. drying hair with a towel, B. washing face with a towel, C. putting a towel on her neck", "video-llm-prediction": "A woman is seen drying her hair with a towel, washing her face with a towel, and putting a towel on her neck.", "gt-answer": "C. putting a towel on her neck", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is drying her hair with a towel, washing her face with the same towel, and putting the towel around her neck.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "A woman is seen drying her hair with a towel. She then proceeds to wash her face with the same towel. Finally, she puts the towel around her neck.", "gt-answer": "C. putting a towel on her neck", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is shown drying her hair with a towel, washing her face with a towel, and putting a towel on her neck.", "chatgpt-answer": "A. drying hair with a towel, B. washing face with a towel, C. putting a towel on her neck", "video-llm-prediction": "A woman is shown drying her hair with a towel, washing her face with a towel, and putting a towel on her neck.", "gt-answer": "C. putting a towel on her neck", "rating": 0 } ] }, "8307961": { "order": [ { "chatgpt-reasoning": "Based on the video description, the man is first walking and simultaneously showing something on his tablet to the woman. Then, he stops and starts chatting with the woman while still showing her something on his tablet.", "chatgpt-answer": "A. Walking and simultaneously showing something on his tablet to a woman", "video-llm-prediction": "The video shows a man and a woman walking down a street while the man is showing something on his tablet to the woman. The man then stops and starts chatting with the woman while still showing her something on his tablet. The video seems to be focused on the man's interaction with the woman and his use of the tablet.", "gt-answer": "B. Chatting with a woman while walking and then showing something on his tablet to a woman", "rating": 0 }, { "chatgpt-reasoning": "In the video description, it is mentioned that the man is first shown walking down the street while showing something on his tablet to a woman. The description then states that the man proceeds to chat with the woman while still walking. Therefore, the correct order of actions performed by the man is first showing something on his tablet to a woman and then chatting with the woman while walking.", "chatgpt-answer": "C. Showing something on his tablet to a woman and then chatting with a woman while walking", "video-llm-prediction": "A man is seen walking down the street while showing something on his tablet to a woman. The man then proceeds to chat with the woman while still walking. The video captures the man's actions of showing something on his tablet and chatting with the woman while walking.", "gt-answer": "B. Chatting with a woman while walking and then showing something on his tablet to a woman", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is initially walking and showing something on his tablet to a woman, then he chats with the woman while walking. This means that the correct order of actions performed by the man is first showing something on his tablet to a woman and then chatting with the woman while walking.", "chatgpt-answer": "C. Showing something on his tablet to a woman and then chatting with a woman while walking", "video-llm-prediction": "A man is seen walking and showing something on his tablet to a woman. He then chats with the woman while walking.", "gt-answer": "B. Chatting with a woman while walking and then showing something on his tablet to a woman", "rating": 0 }, { "chatgpt-reasoning": "The correct order of actions performed by the man is as follows: first, he is walking and simultaneously showing something on his tablet to a woman. Then, he chats with the woman while walking and shows her something on his tablet again.", "chatgpt-answer": "B. Chatting with a woman while walking and then showing something on his tablet to a woman", "video-llm-prediction": "A man is seen walking and simultaneously showing something on his tablet to a woman. The man then chats with the woman while walking and shows her something on his tablet again.", "gt-answer": "B. Chatting with a woman while walking and then showing something on his tablet to a woman", "rating": 1 } ] }, "15439453": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man and woman are dancing the tango in a room with a piano. It also mentions that the man is playing the piano while the woman is dancing. Therefore, the correct answer is A. Tango dancing and playing piano.", "chatgpt-answer": "A. Tango dancing and playing piano", "video-llm-prediction": "The video showcases a man and a woman dancing the tango in a room with a piano. The woman is wearing a red dress and the man is wearing a black suit. The man is playing the piano while the woman is dancing. The video also shows the man and woman dancing in different locations, including a room with a couch and a chair, and a room with a window. The video ends with the man and woman hugging.", "gt-answer": "D. Tango dancing and playing saxophone", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man and woman are dancing the tango, while one of them is playing the piano and the other person is dancing. None of the other choices mention tango dancing or piano playing.", "chatgpt-answer": "A. Tango dancing and playing piano", "video-llm-prediction": "The video showcases a man and a woman dancing the tango in a room with a piano. The man is dressed in a black suit and red tie, while the woman is wearing a red dress. The man starts by playing the piano while the woman dances, and then they switch roles. The man dances while the woman plays the piano, and they end the performance by hugging each other.", "gt-answer": "D. Tango dancing and playing saxophone", "rating": 0 }, { "chatgpt-reasoning": "The video description states that a man and a woman are dancing tango in a room while a man plays the piano. It also mentions that the woman then dances ballet and plays the saxophone, and the man then dances tango and plays the violin. So, the correct answer is:", "chatgpt-answer": "C. Tango dancing and playing violin", "video-llm-prediction": "A man and a woman dance tango in a room while a man plays the piano. The woman then dances ballet and plays the saxophone. The man then dances tango and plays the violin.", "gt-answer": "D. Tango dancing and playing saxophone", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man and woman are dancing tango in a room while a man plays the piano. It also mentions that the woman dances ballet and plays the saxophone, and the man dances tango with a red dress and plays the violin. Based on this information, the activities being performed simultaneously in the video are tango dancing and playing piano.", "chatgpt-answer": "A. Tango dancing and playing piano", "video-llm-prediction": "A man and a woman dance tango in a room while a man plays the piano. The woman then dances ballet and plays the saxophone. The man then dances tango with a red dress and plays the violin. The video ends with the man and woman dancing tango again.", "gt-answer": "D. Tango dancing and playing saxophone", "rating": 0 } ] }, "1107947873": { "action": [ { "chatgpt-reasoning": "The video description mentions multiple actions that the doctor is performing - writing a prescription, giving medicine to a patient, and performing a surgery. However, we cannot determine which specific action the doctor is currently doing as the video does not provide a clear indication of the chronological order of events.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A doctor is seen writing a prescription for a patient. She then proceeds to give the patient the medicine. The doctor is seen performing a surgery on a table.", "gt-answer": "B. giving medicine to a patient", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the doctor is seen writing a prescription for a patient, giving medicine to a patient, and performing a surgery on a table. Based on this information, we can conclude that all three actions are being performed by the doctor in the scenario.", "chatgpt-answer": "A. writing a prescription, B. giving medicine to a patient, and C. performing a surgery", "video-llm-prediction": "A doctor is seen writing a prescription for a patient. She then proceeds to give the patient the medicine. The doctor is seen performing a surgery on a table.", "gt-answer": "B. giving medicine to a patient", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the doctor is seen writing a prescription and giving medicine to a patient. It then mentions that she proceeds to perform a surgery.", "chatgpt-answer": "C. performing a surgery", "video-llm-prediction": "A doctor is seen writing a prescription and giving medicine to a patient. She then proceeds to perform a surgery.", "gt-answer": "B. giving medicine to a patient", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the doctor is seen writing a prescription for a patient and then proceeds to give the patient the medicine. This indicates that the doctor is both writing a prescription and giving medicine to the patient.", "chatgpt-answer": "A. writing a prescription, B. giving medicine to a patient", "video-llm-prediction": "A doctor is seen writing a prescription for a patient. She then proceeds to give the patient the medicine. The video showcases the doctor's professionalism and dedication to her patients.", "gt-answer": "B. giving medicine to a patient", "rating": 0 } ] }, "1081194848": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the researcher is teaching the children how to cook the frog.", "chatgpt-answer": "A. teaching children how to cook a frog", "video-llm-prediction": "In the video, a group of children are shown sitting at a table with a frog on it. A researcher is teaching them how to cook the frog. The children are seen cutting the frog into small pieces and then cooking it. The video is focused on teaching children how to cook a frog.", "gt-answer": "C. teaching children how to dissect a frog", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the researcher is teaching the children how to dissect a frog, as they are cutting the frog open with scissors and observing its internal organs.", "chatgpt-answer": "C. teaching children how to dissect a frog", "video-llm-prediction": "In the video, a group of children are shown sitting around a table with a frog on it. A researcher is teaching them how to dissect the frog. The children are seen cutting the frog open with scissors and observing its internal organs. The researcher is also seen feeding the frog and showing the children how to catch it. The video provides a detailed insight into the process of dissecting a frog and the importance of understanding its internal organs. The children are seen learning and having fun at the same time. Overall, the video is an excellent resource for anyone interested in", "gt-answer": "C. teaching children how to dissect a frog", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the researcher is teaching children how to cook a frog. None of the other choices are mentioned in the video description.", "chatgpt-answer": "A. teaching children how to cook a frog", "video-llm-prediction": "A researcher teaches children how to cook a frog.", "gt-answer": "C. teaching children how to dissect a frog", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the researcher is teaching the children how to dissect a frog.", "chatgpt-answer": "C. teaching children how to dissect a frog", "video-llm-prediction": "In the video, a group of children are shown in a classroom, with a researcher teaching them how to cook a frog. The children are seen holding the frog and cutting it up with the guidance of the researcher. The video is an educational one, aimed at teaching children how to cook a frog. The children are seen learning how to dissect a frog, catch a frog, and feed a frog. The video is an excellent resource for children who are interested in learning about frogs and their habitat.", "gt-answer": "C. teaching children how to dissect a frog", "rating": 1 } ] }, "1091526823": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is opening a book, writing on it, turning over pages, and closing it.", "chatgpt-answer": "D. closing a book", "video-llm-prediction": "A person is seen opening a book, writing on it, turning over pages, and closing it.", "gt-answer": "C. turning over pages of a book", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is opening a book, writing on it, turning over pages, and finally closing the book. Therefore, all of the actions described are happening to the hand in the video.", "chatgpt-answer": "All of the choices are correct", "video-llm-prediction": "A person is seen opening a book, writing on it, turning over pages, and finally closing the book.", "gt-answer": "C. turning over pages of a book", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is opening a book, writing on it, turning over pages, and finally closing the book. Each action corresponds to one of the choices.", "chatgpt-answer": "A. opening a book, B. writing on a book, C. turning over pages of a book, D. closing a book", "video-llm-prediction": "A person is seen opening a book, writing on it, turning over pages, and finally closing the book.", "gt-answer": "C. turning over pages of a book", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is seen opening a book, writing on it, turning over pages, and finally closing it. These actions are all related to interacting with a book, so the correct answer should be the action that specifically describes what the hand is doing with the book.", "chatgpt-answer": "D. closing a book", "video-llm-prediction": "A person is seen opening a book, writing on it, turning over pages, and finally closing it.", "gt-answer": "C. turning over pages of a book", "rating": 0 } ] }, "26631100": { "order": [ { "chatgpt-reasoning": "The video description mentions that the person starts by holding a piece of clay, then holds a clay pot. It then shows three hands holding the clay pot, followed by two hands holding the clay pot. The video ends with a person holding a clay pot.", "chatgpt-answer": "B. Three hands are holding the clay pot, then two hands are holding the clay pot", "video-llm-prediction": "The video shows a person holding a piece of clay and then proceeding to hold a clay pot. Three hands are then shown holding the clay pot, followed by two hands holding the clay pot. The video ends with a person holding a clay pot.", "gt-answer": "B. Three hands are holding the clay pot, then two hands are holding the clay pot", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions the order of events as:", "chatgpt-answer": "C. Two hands are holding the clay pot, then three hands are holding the clay pot", "video-llm-prediction": "The video showcases the process of creating a clay pot. It starts with one hand holding the clay pot, followed by three hands holding the pot. Then, two hands are shown holding the pot, and finally, three hands are holding the pot. The video emphasizes the importance of teamwork and collaboration in achieving a common goal.", "gt-answer": "B. Three hands are holding the clay pot, then two hands are holding the clay pot", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that initially, one hand is holding the clay pot, then three hands are holding the clay pot, and finally, two hands are holding the clay pot.", "chatgpt-answer": "A. One hand is holding the clay pot, then three hands are holding the clay pot", "video-llm-prediction": "A person is seen holding a clay pot in their hands. Then, three hands are shown holding the clay pot. Finally, two hands are shown holding the clay pot.", "gt-answer": "B. Three hands are holding the clay pot, then two hands are holding the clay pot", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the process starts with one hand holding the clay pot, followed by two more hands joining in. This means that the correct order of events is \"One hand is holding the clay pot, then three hands are holding the clay pot.\"", "chatgpt-answer": "A. One hand is holding the clay pot, then three hands are holding the clay pot", "video-llm-prediction": "The video showcases the process of creating a clay pot using three hands. The first hand holds the clay pot, followed by two more hands that join in to create the pot. The video highlights the skill and coordination required to create a pot using this technique.", "gt-answer": "B. Three hands are holding the clay pot, then two hands are holding the clay pot", "rating": 0 } ] }, "1104663381": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is cutting a pizza dough, stretching it, and folding it.", "chatgpt-answer": "A. cutting a pizza dough", "video-llm-prediction": "A man is seen cutting a pizza dough, stretching it, and folding it in a restaurant.", "gt-answer": "B. stretching a pizza dough", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is seen cutting a pizza dough, stretching the dough, and folding it.", "chatgpt-answer": "A. cutting a pizza dough, B. stretching a pizza dough, C. folding a pizza dough", "video-llm-prediction": "A man wearing a blue shirt and an apron is seen cutting a pizza dough. He then stretches the dough and folds it.", "gt-answer": "B. stretching a pizza dough", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the man is seen cutting a pizza dough, stretching the dough, and folding it.", "chatgpt-answer": "A. cutting a pizza dough, B. stretching a pizza dough, C. folding a pizza dough", "video-llm-prediction": "A man in a blue shirt is seen cutting a pizza dough. He then stretches the dough and folds it.", "gt-answer": "B. stretching a pizza dough", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is cutting a pizza dough, stretching it, and folding it in a restaurant. Therefore, all three actions mentioned in the multi-choice question are correct.", "chatgpt-answer": "A. cutting a pizza dough, B. stretching a pizza dough, C. folding a pizza dough", "video-llm-prediction": "A man is seen cutting a pizza dough, stretching it, and folding it in a restaurant.", "gt-answer": "B. stretching a pizza dough", "rating": 0 } ], "direction": [ { "chatgpt-reasoning": "The video description mentions that the man is seen spinning the dough around in the air. This indicates that the pizza dough is rotating.", "chatgpt-answer": "B. clockwise", "video-llm-prediction": "A man wearing a blue shirt and an apron is shown kneading dough in a restaurant. He is wearing a mask and is seen spinning the dough around in the air. The video showcases the process of making pizza dough.", "gt-answer": "A. counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the man is seen spinning the dough around in circles. Since the direction of rotation is not specified, we can assume that the rotation can be either clockwise or counter-clockwise.", "chatgpt-answer": "Either A. counter-clockwise or B. clockwise", "video-llm-prediction": "The video shows a man wearing a blue shirt and an apron, who is kneading dough in a restaurant. He is wearing a mask and is seen spinning the dough around in circles. The man is seen kneading the dough for a while before spinning it around in circles again. The video ends with the man spinning the dough around in circles one last time.", "gt-answer": "A. counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is rotating the dough in a circular motion. Therefore, the pizza dough is rotating.", "chatgpt-answer": "B. clockwise", "video-llm-prediction": "A man is shown kneading dough in a restaurant. He rotates the dough in a circular motion, and the camera captures the action from different angles. The man continues to knead the dough until it reaches the desired consistency.", "gt-answer": "A. counter-clockwise", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man rotates the dough in a circular motion. Since there is no specific mention of the direction, we can assume that the dough is rotating in one direction throughout the video.", "chatgpt-answer": "C. it is not rotating", "video-llm-prediction": "A man in a blue shirt is seen kneading dough in a restaurant. He rotates the dough in a circular motion, and the camera captures the action from different angles. The man continues to knead the dough, and the camera captures the action from different angles. The video ends with the man finishing kneading the dough.", "gt-answer": "A. counter-clockwise", "rating": 0 } ] }, "22100041": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman is seen waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something. Each of the choices corresponds to one of the actions mentioned in the video description.", "chatgpt-answer": "A. waving goodbye, B. clapping her hands, C. doing an invitation gesture, D. pointing towards something", "video-llm-prediction": "A woman is seen waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.", "gt-answer": "C. doing an invitation gesture", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the woman is waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.", "chatgpt-answer": "A. waving goodbye, B. clapping her hands, C. doing an invitation gesture, D. pointing towards something", "video-llm-prediction": "The video features a woman who is seen waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something. The woman appears to be in a good mood and is wearing a blue shirt. The video seems to be shot in a room with a bookshelf in the background. The woman's actions are synchronized with the background music, which adds to the overall ambiance of the video. The video seems to be promoting a product or service, but the specific details are not provided in the given information. Overall, the video is a short and simple clip that showcases", "gt-answer": "C. doing an invitation gesture", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is \"waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.\" This indicates that the woman is performing multiple actions, including waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.", "chatgpt-answer": "None of the choices are correct.", "video-llm-prediction": "A woman in a blue shirt is seen waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.", "gt-answer": "C. doing an invitation gesture", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the woman is waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.", "chatgpt-answer": "A. waving goodbye, B. clapping her hands, C. doing an invitation gesture, D. pointing towards something", "video-llm-prediction": "A woman in a blue shirt is seen waving goodbye, clapping her hands, doing an invitation gesture, and pointing towards something.", "gt-answer": "C. doing an invitation gesture", "rating": 0 } ] }, "1103623921": { "action": [ { "chatgpt-reasoning": "The video description explicitly mentions that the man is playing pool.", "chatgpt-answer": "A. playing pool", "video-llm-prediction": "A man is playing pool and hits the ball with a cue stick. He then hits the ball again and it goes into the pocket.", "gt-answer": "A. playing pool", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the man is playing pool in a dimly lit room. It describes how he takes a shot, hits the ball into the corner pocket, and continues to play. The description also mentions the sound of the ball hitting the pocket, which further supports the idea that the man is playing pool.", "chatgpt-answer": "A. playing pool", "video-llm-prediction": "A man is seen playing pool in a dimly lit room. He takes a shot and hits the ball into the corner pocket. The sound of the ball hitting the pocket echoes throughout the room. The man appears to be focused and determined as he continues to play. The camera captures the movement of the ball as it travels across the table, and the sound of the cue stick hitting the ball. The lighting in the room is low, and the only source of light is the pool table itself. The man seems to be enjoying himself as he plays, and the sound of the ball hitting the pocket adds to the", "gt-answer": "A. playing pool", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the man is playing pool and hitting the balls with a stick.", "chatgpt-answer": "A. playing pool", "video-llm-prediction": "A man is playing pool and hits the balls with a stick.", "gt-answer": "A. playing pool", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is playing pool and hitting the balls with a stick.", "chatgpt-answer": "A. playing pool", "video-llm-prediction": "A man is playing pool and hitting the balls with a stick.", "gt-answer": "A. playing pool", "rating": 1 } ], "speed": [ { "chatgpt-reasoning": "The video description does not provide any information about the speed at which the video is playing. Therefore, we cannot determine the correct answer based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man playing pool and hitting the cue ball with a stick. The cue ball is seen moving around the table, and the man hits it multiple times. The video also shows the man hitting the cue ball with a stick, and the cue ball is seen moving around the table. The video ends with the man hitting the cue ball with a stick.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man continues to hit the balls and the camera captures the movement of the balls. This indicates that the video is playing at normal speed, as it shows the ongoing action in real-time.", "chatgpt-answer": "C. normal speed", "video-llm-prediction": "A man is seen playing pool on a green table. He hits the balls with a cue stick, and the balls move around the table. The man continues to hit the balls, and the camera captures the movement of the balls.", "gt-answer": "C. normal speed", "rating": 1 }, { "chatgpt-reasoning": "Based on the description, there is no indication or mention of the speed at which the video is playing. Therefore, we cannot determine the speed of the video from the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is playing pool and hits the cue ball with a stick. The ball hits the other balls and they scatter.", "gt-answer": "C. normal speed", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the video is played in slow motion, fast forward, and normal speed. It indicates that the video is being played at different speeds.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a man playing pool on a green table. He is seen hitting the cue ball with a cue stick, causing it to hit the other balls on the table. The video is played in slow motion, fast forward, and normal speed, highlighting the different movements of the cue ball and the other balls. The video ends with the man hitting the cue ball again, causing it to hit the other balls on the table.", "gt-answer": "C. normal speed", "rating": 0 } ] }, "1093338031": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is seen clicking on the screen, fixing the screen, cleaning the screen, and finally punching the screen. This indicates that the man is attempting to punch the computer screen.", "chatgpt-answer": "D. punch a computer screen", "video-llm-prediction": "A man is seen sitting in front of a computer screen, and he is seen clicking on the screen. He then proceeds to fix the screen, and then he cleans the screen. Finally, he punches the screen.", "gt-answer": "D. punch a computer screen", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is sitting in front of a computer screen and he clicks on it. Later, he proceeds to fix the screen and then cleans it. Finally, he punches the screen. From this information, we can infer that the man is attempting to punch the computer screen.", "chatgpt-answer": "D. punch a computer screen", "video-llm-prediction": "A man is seen sitting in front of a computer screen, and he clicks on it. He then proceeds to fix the screen, and after that, he cleans it. Finally, he punches the screen, and the video ends.", "gt-answer": "D. punch a computer screen", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen clicking on the computer screen, fixing it, and cleaning it. This implies that he is attempting to fix and clean the computer screen.", "chatgpt-answer": "B. fix a computer screen", "video-llm-prediction": "A man is seen sitting in front of a computer screen and clicking on it. He then proceeds to fix the screen and clean it.", "gt-answer": "D. punch a computer screen", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is sitting in front of a computer screen and fixing it. He then proceeds to clean the screen. This suggests that his intention is to fix the computer screen and then clean it.", "chatgpt-answer": "B. fix a computer screen", "video-llm-prediction": "A man is seen sitting in front of a computer screen, fixing it. He then proceeds to clean the screen.", "gt-answer": "D. punch a computer screen", "rating": 0 } ] }, "1064310466": { "action": [ { "chatgpt-reasoning": "The video description mentions that the man is holding a cocoa seed, peeling it, watering it, and planting it. This indicates that the man is engaging in the process of planting cocoa seeds.", "chatgpt-answer": "B. planting cocoa seeds", "video-llm-prediction": "A man is seen holding a cocoa seed and peeling it. He then proceeds to water the seed and plants it. The video showcases the process of cocoa seed cultivation and processing.", "gt-answer": "D. peeling cocoa seeds", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is holding a cocoa seed and peeling it, as well as holding a cocoa pod and a cocoa bean. Based on this information, it can be inferred that the man is peeling cocoa seeds.", "chatgpt-answer": "D. peeling cocoa seeds", "video-llm-prediction": "The video depicts a man engaging in various activities related to cocoa seeds. He is seen holding a cocoa seed and peeling it, as well as holding a cocoa pod and a cocoa bean. The video also shows a man holding a cocoa pod and a cocoa bean, as well as a cocoa pod and a cocoa bean.", "gt-answer": "D. peeling cocoa seeds", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the man is peeling cocoa seeds and then planting them.", "chatgpt-answer": "D. peeling cocoa seeds", "video-llm-prediction": "A man is seen peeling cocoa seeds and then planting them.", "gt-answer": "D. peeling cocoa seeds", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is first seen peeling cocoa seeds, then planting them, watering them, and finally baking them.", "chatgpt-answer": "D. peeling cocoa seeds", "video-llm-prediction": "A man is seen peeling cocoa seeds and then planting them. He then proceeds to water them and bake them.", "gt-answer": "D. peeling cocoa seeds", "rating": 1 } ] }, "1088497853": { "direction": [ { "chatgpt-reasoning": "The video description mentions that the camera pans around the church, showing its various features. Since the camera is moving horizontally, it indicates a leftwards or rightwards movement. However, there is no information provided specifying the exact direction in which the camera pans. Hence, we cannot conclude the direction of the movement based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a large, old church with a bell tower and a cross on top. The camera pans around the church, showing its various features, including a large arched doorway and a small window. The church is surrounded by a lush green field, and the sky is blue with a few white clouds. The camera then pans out to show the surrounding area, which includes a large mountain in the background.", "gt-answer": "B. upwards", "rating": 0 }, { "chatgpt-reasoning": "The video description does not mention any specific movement or direction. It only describes the location, architecture, and scenery. Therefore, we cannot determine the direction of movement in the video based on the given information.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a beautiful and historic location with a clock tower and a church. The camera pans around the area, capturing the stunning architecture and scenery. The video also includes a shot of a mountain in the background, adding to the overall beauty of the location.", "gt-answer": "B. upwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the church and the surrounding area. Panning typically refers to horizontal movement, so the camera is moving in a leftwards or rightwards direction.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A video of a church with a bell tower and a cross on top. The camera pans around the church and the surrounding area.", "gt-answer": "B. upwards", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the camera pans around the building, which indicates a horizontal movement. The specific direction of the movement is not mentioned, so we cannot determine whether it is leftwards or rightwards.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video showcases a large, old brick building with a small, old brick bell tower on top. The camera pans around the building, capturing its intricate details and the surrounding landscape. The video ends with a panoramic view of the surrounding area.", "gt-answer": "B. upwards", "rating": 0 } ] }, "1106087175": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is drawing on a white sneaker with a green marker and then takes off the sneaker to tie the shoelaces.", "chatgpt-answer": "B. drawing on a white sneaker", "video-llm-prediction": "A man is seen wearing a white sneaker and drawing on it with a green marker. He then takes off the sneaker and ties the shoelaces.", "gt-answer": "B. drawing on a white sneaker", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is wearing a white sneaker, drawing on it with a green marker, and then takes off the sneaker and ties the shoelaces.", "chatgpt-answer": "D. tying shoelaces on a white sneaker", "video-llm-prediction": "A man is seen wearing a white sneaker and drawing on it with a green marker. He then takes off the sneaker and ties the shoelaces.", "gt-answer": "B. drawing on a white sneaker", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen wearing a white sneaker and drawing on it with a green marker. He then takes off the sneaker and ties the shoelaces.", "chatgpt-answer": "D. tying shoelaces on a white sneaker", "video-llm-prediction": "A man is seen wearing a white sneaker and drawing on it with a green marker. He then takes off the sneaker and ties the shoelaces.", "gt-answer": "B. drawing on a white sneaker", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is drawing on a white sneaker and then takes off the sneaker to tie the shoelaces.", "chatgpt-answer": "B. drawing on a white sneaker", "video-llm-prediction": "A man is seen wearing a white sneaker and drawing on it with a green marker. He then takes off the sneaker and ties the shoelaces.", "gt-answer": "B. drawing on a white sneaker", "rating": 1 } ] }, "13324343": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the man is first seen gliding on the skateboard and then tying his shoelaces. After that, he jumps and glides on the skateboard again. Therefore, the correct order of events is A. Man gliding on the skateboard and then tying his shoelaces.", "chatgpt-answer": "A. Man gliding on the skateboard and then tying his shoelaces", "video-llm-prediction": "A man is seen gliding on a skateboard and then tying his shoelaces. He then jumps and glides on the skateboard.", "gt-answer": "B. Man tying his shoelaces and then gliding on the skateboard", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is first seen gliding on the skateboard, then tying his shoelaces, and finally jumping and gliding on the skateboard again. So the correct order of events is A. Man gliding on the skateboard and then tying his shoelaces.", "chatgpt-answer": "A. Man gliding on the skateboard and then tying his shoelaces", "video-llm-prediction": "A man is seen gliding on a skateboard and then tying his shoelaces. He then jumps and glides on the skateboard.", "gt-answer": "B. Man tying his shoelaces and then gliding on the skateboard", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen gliding on a skateboard first, and then he ties his shoelaces.", "chatgpt-answer": "A. Man gliding on the skateboard and then tying his shoelaces", "video-llm-prediction": "A man is seen gliding on a skateboard, then he ties his shoelaces.", "gt-answer": "B. Man tying his shoelaces and then gliding on the skateboard", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the man is first seen gliding on a skateboard, then tying his shoelaces, and finally jumping and tying his shoelaces again.", "chatgpt-answer": "A. Man gliding on the skateboard and then tying his shoelaces", "video-llm-prediction": "A man is seen gliding on a skateboard and then tying his shoelaces. He then jumps and ties his shoelaces again.", "gt-answer": "B. Man tying his shoelaces and then gliding on the skateboard", "rating": 0 } ] }, "1083624811": { "action": [ { "chatgpt-reasoning": "The video description states that the woman is performing push-ups, alternating leg lift plank, traditional plank hold, and side plank variations.", "chatgpt-answer": "A. performing push-ups, B. performing alternating leg lift plank, C. performing a traditional plank hold, D. performing side plank variations", "video-llm-prediction": "A woman is seen performing push-ups on a blue mat. She then moves on to performing alternating leg lift plank and a traditional plank hold. The woman continues to perform side plank variations while maintaining her balance.", "gt-answer": "B. performing alternating leg lift plank", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the woman is performing a variety of exercises, including push-ups, alternating leg lift plank, traditional plank hold, and side plank variations.", "chatgpt-answer": "A. performing push-ups, B. performing alternating leg lift plank, C. performing a traditional plank hold, D. performing side plank variations", "video-llm-prediction": "The video showcases a woman performing a variety of exercises on a blue mat. She starts by doing push-ups and then moves on to performing alternating leg lift plank. The woman then transitions to a traditional plank hold and continues to do side plank variations. Throughout the video, the woman demonstrates impressive strength and control as she performs each exercise with ease. Overall, the video is a great example of how to incorporate a variety of exercises into a workout routine.", "gt-answer": "B. performing alternating leg lift plank", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is performing push-ups, alternating leg lift plank, traditional plank hold, and side plank variations.", "chatgpt-answer": "A. performing push-ups, B. performing alternating leg lift plank, C. performing a traditional plank hold, D. performing side plank variations", "video-llm-prediction": "A woman is seen performing push-ups on a mat. She then transitions into performing alternating leg lift plank. The woman continues to perform a traditional plank hold and side plank variations.", "gt-answer": "B. performing alternating leg lift plank", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the woman is performing push-ups, alternating leg lift plank, traditional plank hold, and side plank variations.", "chatgpt-answer": "A. performing push-ups, B. performing alternating leg lift plank, C. performing a traditional plank hold, D. performing side plank variations", "video-llm-prediction": "A woman is seen performing push-ups on a blue mat. She then moves on to performing alternating leg lift plank and a traditional plank hold. The woman also performs side plank variations while maintaining her balance.", "gt-answer": "B. performing alternating leg lift plank", "rating": 0 } ] }, "1014976360": { "order": [ { "chatgpt-reasoning": "The video description states that the man is putting on his glasses and looking at his phone first, then he takes off his glasses and looks at his phone again.", "chatgpt-answer": "A. putting on his glasses and then looking at his phone", "video-llm-prediction": "A man is seen putting on his glasses and looking at his phone. He then takes off his glasses and looks at his phone again.", "gt-answer": "D. looking at his phone and then taking off his glasses", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man first puts on his glasses and then looks at his phone. After that, he takes off his glasses and looks at his phone again. So the correct order of events for the man is putting on his glasses and then looking at his phone.", "chatgpt-answer": "A. putting on his glasses and then looking at his phone", "video-llm-prediction": "The video shows a man putting on his glasses and looking at his phone. He then takes off his glasses and looks at his phone again.", "gt-answer": "D. looking at his phone and then taking off his glasses", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man first puts on his glasses and then looks at his phone. After that, he takes off his glasses and looks at his phone again.", "chatgpt-answer": "A. putting on his glasses and then looking at his phone", "video-llm-prediction": "A man is seen putting on his glasses and looking at his phone. He then takes off his glasses and looks at his phone again.", "gt-answer": "D. looking at his phone and then taking off his glasses", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen putting on his glasses and looking at his phone initially, then he takes off his glasses and looks at his phone again. This means that the correct order of events for the man is first putting on his glasses and then looking at his phone, followed by taking off his glasses and then looking at his phone again.", "chatgpt-answer": "A. putting on his glasses and then looking at his phone", "video-llm-prediction": "A man is seen putting on his glasses and looking at his phone. He then takes off his glasses and looks at his phone again.", "gt-answer": "D. looking at his phone and then taking off his glasses", "rating": 0 } ] }, "18416608": { "order": [ { "chatgpt-reasoning": "The video description clearly states that the woman first opens the bottle and takes a sip, then proceeds to use her tablet. Therefore, the correct order of actions is sampling water in a bottle first, then operating her tablet.", "chatgpt-answer": "C. sampling water in a bottle first, then operating her tablet", "video-llm-prediction": "A woman is seen kneeling down by a river, holding a bottle and a tablet. She opens the bottle and takes a sip, then proceeds to use her tablet. She then closes the bottle and continues to use her tablet.", "gt-answer": "C. sampling water in a bottle first, then operating her tablet", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is seen kneeling down by a river, operating her tablet, and then sampling water in a bottle. This indicates that she first operates her tablet and then samples water in a bottle.", "chatgpt-answer": "A. operating her tablet first, then sampling water in a bottle", "video-llm-prediction": "A woman is seen kneeling down by a river, operating her tablet, and then sampling water in a bottle. She repeats this process several times, and the video captures her actions in detail.", "gt-answer": "C. sampling water in a bottle first, then operating her tablet", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is simultaneously operating her tablet and sampling water in a bottle.", "chatgpt-answer": "B. the actions are performed simultaneously", "video-llm-prediction": "A woman is seen kneeling by a river, operating her tablet and sampling water in a bottle simultaneously.", "gt-answer": "C. sampling water in a bottle first, then operating her tablet", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman first opens the bottle and takes a sip, then proceeds to use her tablet. Therefore, the correct order of actions is \"sampling water in a bottle first, then operating her tablet.\"", "chatgpt-answer": "C. sampling water in a bottle first, then operating her tablet", "video-llm-prediction": "A woman is seen kneeling on the ground next to a river. She is holding a bottle and a tablet. She opens the bottle and takes a sip, then proceeds to use her tablet. She then closes the bottle and continues to use her tablet.", "gt-answer": "C. sampling water in a bottle first, then operating her tablet", "rating": 1 } ] }, "1061351290": { "order": [ { "chatgpt-reasoning": "The video description states that the woman is seen measuring her pregnant belly with a measuring tape first, then touching her belly, and later measuring her belly again with the measuring tape.", "chatgpt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "video-llm-prediction": "A woman is seen measuring her pregnant belly with a measuring tape. She then touches her belly and takes a nap. Later, she is seen measuring her belly again with the measuring tape.", "gt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the woman first measures her belly with a measuring tape, then touches her pregnant belly, takes a nap, and wakes up to continue measuring her belly with the measuring tape. The correct order of events is therefore D, touching her pregnant belly and then measuring her belly with a measuring tape.", "chatgpt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "video-llm-prediction": "A woman is seen measuring her pregnant belly with a measuring tape. She then touches her belly and takes a nap. Later, she wakes up and continues to measure her belly with the measuring tape.", "gt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "rating": 1 }, { "chatgpt-reasoning": "The video description provides a clear sequence of events. First, the woman is measuring her belly with a measuring tape. Then, she touches her pregnant belly. After that, she takes a nap. Lastly, she is seen measuring her belly again with the measuring tape.", "chatgpt-answer": "A. measuring her belly with a measuring tape and then touching her pregnant belly", "video-llm-prediction": "A woman is seen measuring her pregnant belly with a measuring tape. She then touches her belly and takes a nap. Later, she is seen measuring her belly again with the measuring tape.", "gt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is first measuring her pregnant belly with a measuring tape and then touching her belly.", "chatgpt-answer": "A. measuring her belly with a measuring tape and then touching her pregnant belly", "video-llm-prediction": "A woman is seen measuring her pregnant belly with a measuring tape and then touching her belly.", "gt-answer": "D. touching her pregnant belly and then measuring her belly with a measuring tape", "rating": 0 } ] }, "1066238617": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman is dancing, practicing her punches, and cooking in the same location.", "chatgpt-answer": "A. dancing", "video-llm-prediction": "A woman is seen dancing in the woods while wearing a black tank top. She is also seen practicing her punches and cooking in the same location.", "gt-answer": "B. practising her punches", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is dancing and practicing her punches in the woods.", "chatgpt-answer": "A. dancing", "video-llm-prediction": "The video features a woman who is seen dancing in the woods. She is wearing a black tank top and is surrounded by trees. The woman is also seen practicing her punches in the woods. The video captures the beauty of nature and the woman's movements are graceful and fluid. The woman's outfit is simple yet elegant, and her movements are in sync with the rhythm of the music. The video is a perfect representation of the beauty of nature and the joy of movement.", "gt-answer": "B. practising her punches", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is seen dancing in the woods while wearing a black tank top. It also mentions that she is practicing her punches and cooking in the same location. Therefore, the correct answer is A. dancing, as it is explicitly mentioned in the video description.", "chatgpt-answer": "A. dancing", "video-llm-prediction": "A woman is seen dancing in the woods while wearing a black tank top. She is also seen practicing her punches and cooking in the same location.", "gt-answer": "B. practising her punches", "rating": 0 }, { "chatgpt-reasoning": "Based on the video description, the woman is seen dancing in the woods while wearing a black tank top and practicing her punches. There is no mention of her cooking, so we can eliminate option C. Additionally, the video description specifically mentions that she is seen practicing her punches, so option B is correct.", "chatgpt-answer": "B. practising her punches", "video-llm-prediction": "A woman is seen dancing in the woods while wearing a black tank top. She is also seen practicing her punches and cooking in the same location.", "gt-answer": "B. practising her punches", "rating": 1 } ] }, "1072000366": { "action": [ { "chatgpt-reasoning": "Based on the video description, the girls are seen elbowing each other, giving each other a high five, waving at each other, and shaking hands. Therefore, all of the options A, B, C, and D can be considered as correct answers.", "chatgpt-answer": "A, B, C, D", "video-llm-prediction": "Two girls are seen in a hallway, and they are seen elbowing each other. They then give each other a high five. The girls are seen waving at each other and shaking hands.", "gt-answer": "A. elbowing each other", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girls are giving each other high fives.", "chatgpt-answer": "B. giving high five to each other", "video-llm-prediction": "Two girls are seen in a hallway, and they are wearing face masks. They are seen talking to each other, and they are also seen giving each other high fives. The girls seem to be enjoying each other's company, and they are also seen waving at each other. The video seems to be showing the girls' playful and friendly behavior towards each other.", "gt-answer": "A. elbowing each other", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the girls are seen elbowing each other and then giving each other a high five. This indicates that the correct answer is B - giving high five to each other.", "chatgpt-answer": "B. giving high five to each other", "video-llm-prediction": "Two girls are seen in a hallway, and they are seen elbowing each other. They then give each other a high five. The video seems to be a lighthearted moment between friends.", "gt-answer": "A. elbowing each other", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the girls are seen elbowing each other and then proceed to give each other a high five.", "chatgpt-answer": "A. elbowing each other, B. giving high five to each other", "video-llm-prediction": "Two girls are seen in a hallway, and they are seen elbowing each other. They then proceed to give each other a high five. The girls seem to be enjoying each other's company and are having a good time. The video captures the playful and lighthearted nature of the girls' interaction.", "gt-answer": "A. elbowing each other", "rating": 0 } ] }, "1065272113": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the doctor is taking the woman's blood pressure, checking her temperature, and giving her an injection.", "chatgpt-answer": "A. taking her blood pressure, B. checking her temperature, C. giving her an injection", "video-llm-prediction": "A doctor is seen taking a woman's blood pressure and checking her temperature. The doctor then proceeds to give her an injection.", "gt-answer": "C. giving her an injection", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the doctor is taking the woman's blood pressure, checking her temperature, and giving her an injection.", "chatgpt-answer": "A. taking her blood pressure, B. checking her temperature, C. giving her an injection", "video-llm-prediction": "The video depicts a doctor performing a medical procedure on a woman. The doctor is seen taking her blood pressure, checking her temperature, and giving her an injection. The woman appears to be in discomfort and is seen crying during the procedure. The video highlights the importance of medical professionals and the care they provide to their patients.", "gt-answer": "C. giving her an injection", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the doctor is taking the woman's blood pressure, checking her temperature, and giving her an injection.", "chatgpt-answer": "A. taking her blood pressure, B. checking her temperature, C. giving her an injection", "video-llm-prediction": "A doctor is seen taking a woman's blood pressure and checking her temperature. The doctor then proceeds to give her an injection.", "gt-answer": "C. giving her an injection", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the doctor is taking the woman's blood pressure, checking her temperature, and giving her an injection.", "chatgpt-answer": "A. taking her blood pressure, B. checking her temperature, C. giving her an injection", "video-llm-prediction": "A doctor is seen taking a woman's blood pressure and checking her temperature. She then proceeds to give the woman an injection.", "gt-answer": "C. giving her an injection", "rating": 0 } ] }, "1072971926": { "action": [ { "chatgpt-reasoning": "The video description mentions that the man is opening the pizza box, wrapping it, eating it, and then closing the pizza box.", "chatgpt-answer": "Option A. opening the pizza box", "video-llm-prediction": "A man is seen opening a pizza box, wrapping it, eating it, and then closing the pizza box.", "gt-answer": "A. opening the pizza box", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen opening the pizza box, wrapping it, eating it, and then closing the pizza box. This implies that the man is performing multiple actions with the pizza box, including opening it, wrapping it, eating the pizza, and finally closing the box.", "chatgpt-answer": "A. opening the pizza box\u3001B. wrapping the pizza box\u3001C. eating the pizza, D. closing the pizza box", "video-llm-prediction": "A man is seen opening a pizza box, wrapping it, eating it, and then closing the pizza box.", "gt-answer": "A. opening the pizza box", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man is performing several actions in a specific sequence - opening the pizza box, wrapping it, eating the pizza, and then closing the pizza box.", "chatgpt-answer": "D. closing the pizza box", "video-llm-prediction": "A man is seen opening a pizza box, wrapping it, eating it, and then closing the pizza box.", "gt-answer": "A. opening the pizza box", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen opening a pizza box, wrapping it, eating it, and then closing the pizza box. This implies that the man is performing these actions in sequence with the pizza box.", "chatgpt-answer": "D. closing the pizza box", "video-llm-prediction": "A man is seen opening a pizza box, wrapping it, eating it, and then closing the pizza box.", "gt-answer": "A. opening the pizza box", "rating": 0 } ] }, "3399348431": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is mixing vegetables in a bowl, squeezing juice into the bowl, and finally dipping the vegetables into the juice. This implies that the person is using the sauce to mix it with the vegetables and also dipping the vegetables in it.", "chatgpt-answer": "A. mixing it with the vegetables", "video-llm-prediction": "A person is seen mixing vegetables in a bowl. They then proceed to squeeze a juice into the bowl and mix it with the vegetables. Finally, they dip the vegetables into the juice.", "gt-answer": "B. squeezing it into a bowl of vegetables", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the person is squeezing the juice into the bowl and then mixing it with the vegetables. Finally, they dip the vegetables in the sauce.", "chatgpt-answer": "B. squeezing it into a bowl of vegetables", "video-llm-prediction": "A person is seen mixing vegetables in a bowl. They then proceed to squeeze a juice into the bowl and mix it with the vegetables. Finally, they dip the vegetables in the juice.", "gt-answer": "B. squeezing it into a bowl of vegetables", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the person is mixing vegetables in a bowl, squeezing juice into the bowl, and then dipping the vegetables into the juice. Therefore, the person is doing all three actions with the sauce - mixing it with the vegetables, squeezing it into a bowl of vegetables, and dipping vegetables in it.", "chatgpt-answer": "A. mixing it with the vegetables", "video-llm-prediction": "A person is seen mixing vegetables in a bowl. They then squeeze a juice into the bowl and mix it with the vegetables. Finally, they dip the vegetables into the juice.", "gt-answer": "B. squeezing it into a bowl of vegetables", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the person is mixing vegetables in a bowl, squeezing a juice into the bowl, and dipping vegetables in it. This implies that the person is using the sauce in all these actions - mixing it with the vegetables, squeezing it into a bowl of vegetables, and dipping vegetables in it.", "chatgpt-answer": "A. mixing it with the vegetables", "video-llm-prediction": "A person is seen mixing vegetables in a bowl, squeezing a juice into the bowl, and dipping vegetables in it.", "gt-answer": "B. squeezing it into a bowl of vegetables", "rating": 0 } ] }, "1025137214": { "action": [ { "chatgpt-reasoning": "The video description mentions that the man is seen walking down a street while smoking a cigarette. It also states that he then sits down and talks on the phone. This indicates that the man is doing multiple actions in the video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A man is seen walking down a street while smoking a cigarette. He then sits down and talks on the phone.", "gt-answer": "B. smoking cigarette", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is walking down a street while smoking a cigarette, and then he sits down and talks on his phone. Therefore, all three activities mentioned in the choices (walking, smoking cigarette, talking on the phone) are correct.", "chatgpt-answer": "A. walking, B. smoking cigarette, C. talking on the phone", "video-llm-prediction": "A man is seen walking down a street while smoking a cigarette. He then sits down and talks on his phone.", "gt-answer": "B. smoking cigarette", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is seen smoking a cigarette while laying on the ground. It implies that he is performing the action of smoking a cigarette.", "chatgpt-answer": "B. smoking cigarette", "video-llm-prediction": "A man is seen smoking a cigarette while laying on the ground. He then gets up and walks away.", "gt-answer": "B. smoking cigarette", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is seen walking down the street while smoking a cigarette, and then he sits down and talks on his phone. Therefore, the correct answer is C. talking on the phone.", "chatgpt-answer": "C. talking on the phone", "video-llm-prediction": "A man is seen walking down the street while smoking a cigarette. He then sits down and talks on his phone.", "gt-answer": "B. smoking cigarette", "rating": 0 } ] }, "1033101626": { "action": [ { "chatgpt-reasoning": "The video description mentions that the man is playing a musical instrument.", "chatgpt-answer": "C. playing instrument", "video-llm-prediction": "A man is seen sitting on a rock by the ocean, playing a musical instrument. He is wearing a blue shirt and is surrounded by rocks. The man is seen playing the instrument in different positions, including sitting on the ground and on a rock. The video captures the serene and peaceful atmosphere of the location, with the sound of the waves crashing against the rocks in the background.", "gt-answer": "C. playing instrument", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is playing a musical instrument.", "chatgpt-answer": "C. playing instrument", "video-llm-prediction": "A man is seen sitting on a rock, playing a musical instrument. He is wearing a blue shirt and is positioned in front of a beautiful view of the ocean. The man continues to play the instrument while looking out at the water.", "gt-answer": "C. playing instrument", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is holding a stick and playing it, which implies that he is playing an instrument. Additionally, the description also states that he is cooking and singing, but there is no mention of him specifically doing those activities.", "chatgpt-answer": "C. playing instrument", "video-llm-prediction": "A man is seen sitting in a cave, holding a stick and playing it. He is also seen cooking and singing.", "gt-answer": "C. playing instrument", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the man is playing a musical instrument. There are no indications of him cooking or singing in the video.", "chatgpt-answer": "C. playing instrument", "video-llm-prediction": "A man is seen sitting on a rock, playing a musical instrument. The camera captures the beautiful scenery of the ocean in the background. The man continues to play the instrument, and the camera pans around the area, showing the beauty of the surroundings. The video ends with the man finishing playing the instrument.", "gt-answer": "C. playing instrument", "rating": 1 } ] }, "9537677": { "action": [ { "chatgpt-reasoning": "The video description states that the woman is initially reading a book, then switches to watching TV and playing with her tablet, and later she is seen cooking. Therefore, the correct answer would be D. cooking, as it is the last activity mentioned in the video description.", "chatgpt-answer": "D. cooking", "video-llm-prediction": "A woman is seen sitting on a bench and reading a book. She then switches to watching TV and playing with her tablet. Later, she is seen cooking.", "gt-answer": "C. playing tablet", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the woman is seen sitting on a bench, reading a book. Additionally, it mentions that she puts the book down and picks up her phone to start texting, implying that her primary activity is reading a book.", "chatgpt-answer": "A. reading a book", "video-llm-prediction": "A woman is seen sitting on a bench, reading a book. She then puts the book down and picks up her phone to start texting. The woman seems to be enjoying her time alone, taking a break from her busy life to relax and unwind. The bench she is sitting on is located in a park, surrounded by trees and greenery. The woman's outfit suggests that she is dressed casually, perhaps for a day of leisure. Overall, the video captures a peaceful moment of a woman taking a break from her daily routine to enjoy some quiet time.", "gt-answer": "C. playing tablet", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is sitting on a bench and reading a book. It also states that she switches to watching TV and playing with her tablet. Therefore, the correct answer would be A. reading a book.", "chatgpt-answer": "A. reading a book", "video-llm-prediction": "A woman is seen sitting on a bench and reading a book. She then switches to watching TV and playing with her tablet.", "gt-answer": "C. playing tablet", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the woman is initially reading a book, then switches to watching TV, and finally playing with her tablet.", "chatgpt-answer": "C. playing tablet", "video-llm-prediction": "A woman is seen sitting on a bench, reading a book. She then switches to watching TV, and finally, she is seen playing with her tablet.", "gt-answer": "C. playing tablet", "rating": 1 } ] }, "1077388994": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman is holding a baby in her arms, patting the baby's back, singing to the baby, and dancing around the room. Therefore, all three actions mentioned in the choices (singing, dancing, and patting the baby) are being performed by the woman.", "chatgpt-answer": "A. singing, B. dancing, C. patting the baby", "video-llm-prediction": "A woman is seen holding a baby in her arms and patting the baby's back. She then sings to the baby and dances around the room.", "gt-answer": "C. patting the baby", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly mentions that the woman is holding a baby in her arms and patting the baby's back. It also states that she sings to the baby and dances with the baby in her arms. Therefore, the correct answer is C. patting the baby.", "chatgpt-answer": "C. patting the baby", "video-llm-prediction": "A woman is seen holding a baby in her arms and patting the baby's back. She then sings to the baby and dances with the baby in her arms. The video captures the tender moments between the woman and the baby.", "gt-answer": "C. patting the baby", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the woman is holding a baby in her arms, patting the baby's back, singing to the baby, and dancing around the room. Therefore, all three actions mentioned (singing, dancing, patting the baby) are correct.", "chatgpt-answer": "A. singing, B. dancing, C. patting the baby", "video-llm-prediction": "A woman is seen holding a baby in her arms and patting the baby's back. She then sings to the baby and dances around the room.", "gt-answer": "C. patting the baby", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the woman is holding a baby and patting it while singing. This suggests that the action she is performing is patting the baby while singing.", "chatgpt-answer": "C. patting the baby", "video-llm-prediction": "A woman is seen holding a baby and patting it while singing.", "gt-answer": "C. patting the baby", "rating": 1 } ] }, "1037531786": { "action": [ { "chatgpt-reasoning": "The video description clearly states that two men are boxing in a ring and that one of the men is seen punching the other man in the face. This indicates that the two men are engaged in a boxing match.", "chatgpt-answer": "C. boxing", "video-llm-prediction": "Two men are seen boxing in a ring. One of the men is wearing a white shirt and the other is wearing a black shirt. The man in the black shirt is seen punching the other man in the face.", "gt-answer": "C. boxing", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that two men are boxing in a ring, with one wearing a white shirt and the other wearing a black shirt. It describes various actions related to boxing, such as one man punching the other man in the face and both men punching each other.", "chatgpt-answer": "C. boxing", "video-llm-prediction": "Two men are seen boxing in a ring, with one of them wearing a white shirt and the other wearing a black shirt. The man in the black shirt is seen punching the other man in the face, while the man in the white shirt is seen punching the man in the black shirt. The man in the black shirt is also seen punching the man in the white shirt.", "gt-answer": "C. boxing", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that two men are boxing in a ring.", "chatgpt-answer": "C. boxing", "video-llm-prediction": "Two men are seen boxing in a ring.", "gt-answer": "C. boxing", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that two men are boxing in a ring, with one wearing a white shirt and the other wearing a black shirt. It describes the actions of both men as punching each other, which aligns with the activity of boxing.", "chatgpt-answer": "C. boxing", "video-llm-prediction": "Two men are seen boxing in a ring, with one wearing a white shirt and the other wearing a black shirt. The man in the black shirt is seen punching the other man in the face, while the man in the white shirt is seen punching the man in the black shirt. The man in the black shirt is also seen punching the man in the white shirt.", "gt-answer": "C. boxing", "rating": 1 } ] }, "1077275024": { "action": [ { "chatgpt-reasoning": "The video description clearly mentions that the little girl is clapping her hands in front of a man playing the ukulele.", "chatgpt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "A little girl wearing a blue dress is seen clapping her hands in front of a man playing the ukulele. The man is wearing a yellow shirt and is playing the ukulele while sitting on the grass. The little girl is seen jumping and dancing in front of the man while he plays the ukulele. The man is also seen playing the ukulele while the little girl is clapping her hands. The video captures the joyful and playful atmosphere of the moment.", "gt-answer": "C. Clapping hands for a man playing ukulele", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the girl is seen clapping her hands in front of a man playing the ukulele. There is no mention of jumping or dancing, only that she continues to clap her hands.", "chatgpt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "A young girl wearing a blue dress and a red bow in her hair is seen clapping her hands in front of a man playing the ukulele. The man is wearing a yellow shirt and is playing the ukulele while sitting on the grass. The girl continues to clap her hands and dances around while the man plays the ukulele. The video captures the joyful and playful atmosphere of the moment.", "gt-answer": "C. Clapping hands for a man playing ukulele", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the little girl is jumping and clapping for a man playing the ukulele. This means that she is both jumping and clapping, but there is no mention of her dancing. Therefore, the correct answer is C. Clapping hands for a man playing ukulele.", "chatgpt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "A little girl jumps and claps for a man playing the ukulele.", "gt-answer": "C. Clapping hands for a man playing ukulele", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly mentions that the girl is clapping her hands in front of a man who is playing the ukulele.", "chatgpt-answer": "C. Clapping hands for a man playing ukulele", "video-llm-prediction": "A young girl wearing a blue dress and a red bow in her hair is seen clapping her hands in front of a man who is playing the ukulele. The man is wearing a yellow shirt and is playing the ukulele while sitting on the grass. The girl continues to clap her hands while the man plays the ukulele.", "gt-answer": "C. Clapping hands for a man playing ukulele", "rating": 1 } ] }, "1107180099": { "action": [ { "chatgpt-reasoning": "The video description clearly mentions that a group of women are seen dancing on a court. They are described as performing a choreography that involves moving their hands and legs in a synchronized manner. The description also mentions that they are doing a handstand and clapping their hands at the end.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of women are seen dancing on a court. They are wearing black and yellow tops and black shorts. The women are performing a choreography that involves moving their hands and legs in a synchronized manner. The women are also seen doing a handstand on the court. The video ends with the women standing in a straight line and clapping their hands.", "gt-answer": "C. dancing", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the group of women are seen dancing on a court, moving their arms and legs in unison.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of women are seen dancing on a court. They move their arms and legs in unison, creating a beautiful and mesmerizing display. The women seem to be enjoying themselves, as they laugh and smile at each other. The dance is graceful and fluid, with the women moving in perfect harmony with each other. The court is surrounded by trees and bushes, creating a serene and peaceful atmosphere. The women's movements are so precise that it seems as though they are one entity, moving as one. Overall, the video captures a beautiful moment of women coming together to dance and enjoy", "gt-answer": "C. dancing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a group of women are seen dancing on a court. They are described as performing a routine that involves jumping and spinning, and doing a handstand. This indicates that the women are engaged in dancing.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of women are seen dancing on a court. They are wearing pink tops and black bottoms. They are performing a routine that involves jumping and spinning. The women are also seen doing a handstand on the court.", "gt-answer": "C. dancing", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a group of women are seen dancing on a court, moving their arms and legs in unison and creating a beautiful and synchronized dance routine.", "chatgpt-answer": "C. dancing", "video-llm-prediction": "A group of women are seen dancing on a court. They move their arms and legs in unison, creating a beautiful and synchronized dance routine. The women seem to be enjoying themselves, and their movements are fluid and graceful. The court is surrounded by a green field, and the sun is shining brightly in the sky, creating a perfect setting for the dance. The women's outfits are colorful, and they seem to be wearing comfortable clothes that allow them to move freely. Overall, the video captures a beautiful moment of women coming together to dance and enjoy each other's company", "gt-answer": "C. dancing", "rating": 1 } ] }, "1049434159": { "action": [ { "chatgpt-reasoning": "The video description mentions that the man and woman are sitting on a couch with a little girl, smiling and laughing. The man is holding a remote control and the little girl is holding a camera. This suggests that they are spending quality time together, possibly taking pictures or recording a video.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "The video shows a man and a woman sitting on a couch with a little girl. The man is holding a remote control, and the little girl is holding a camera. They are all smiling and laughing. The video seems to be a family moment where they are enjoying each other's company. The man and the woman seem to be the parents of the little girl, and they are spending quality time together. The little girl is holding a camera, which suggests that they might be taking pictures or recording a video. The video seems to be a heartwarming moment of a family enjoying each other's", "gt-answer": "B. playing video games", "rating": 0 }, { "chatgpt-reasoning": "The video description clearly states that the man and woman, along with their daughter, are playing video games together. It mentions that they are sitting on a couch, holding remote controls, and capturing joyful moments while playing.", "chatgpt-answer": "B. playing video games", "video-llm-prediction": "The video shows a man and a woman sitting on a couch with a little girl, and they are playing video games together. The man is holding a remote control in his hand, and the little girl is also holding a remote control. The man is wearing a yellow hoodie, and the little girl is wearing a white shirt. The video captures the joyful moments of the family playing video games together.", "gt-answer": "B. playing video games", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is playing a video game while the little girl is watching him. This indicates that the parents and daughter are playing video games together.", "chatgpt-answer": "B. playing video games", "video-llm-prediction": "The video shows a man and a woman sitting on a couch with a little girl. The man is holding a remote control, and the little girl is holding a toy remote control. The man is playing a video game while the little girl is watching him.", "gt-answer": "B. playing video games", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man, woman, and little girl are playing video games together.", "chatgpt-answer": "B. playing video games", "video-llm-prediction": "A man and a woman are sitting on a couch with a little girl, and they are playing video games together. The little girl is holding a game controller and smiling.", "gt-answer": "B. playing video games", "rating": 1 } ] }, "3402234027": { "action": [ { "chatgpt-reasoning": "The video description mentions that the cat is eating food on the ground.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A cat is seen eating food on the ground.", "gt-answer": "C. eating food", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the cat is eating food on the ground.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A cat is seen eating food on the ground.", "gt-answer": "C. eating food", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the cat is \"eating food while sitting on the ground\".", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A cat is seen eating food while sitting on the ground.", "gt-answer": "C. eating food", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the cat is eating food, playing with a toy and also sleeping.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A cat is seen eating food while sitting on the ground. The cat is also seen sleeping and playing with a toy.", "gt-answer": "C. eating food", "rating": 1 } ] }, "1056491306": { "action": [ { "chatgpt-reasoning": "The video description mentions that some passengers are sleeping on the bed, some are standing in a room, one man is taking a seat on the subway, and another man is dancing on the stage.", "chatgpt-answer": "A. sleeping on the bed, C. taking a seat on subway, D. dancing on the stage", "video-llm-prediction": "The video shows passengers on a subway train, with some of them sleeping on the bed and others standing in a room. One man is seen taking a seat on the subway while another is dancing on the stage. The video also shows passengers wearing face masks while sitting on the train.", "gt-answer": "C. taking a seat on subway", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the passengers are sitting in chairs and looking at their phones. It also mentions that the train is filled with people wearing face masks. Based on this information, we can conclude that the passengers are taking a seat on the subway.", "chatgpt-answer": "C. taking a seat on subway", "video-llm-prediction": "A man wearing a blue shirt and black pants is seen sitting on a subway train, wearing a blue face mask. He is seen looking at his phone and then looking out the window. The train is filled with people who are also wearing face masks. The man is seen sitting in a chair, looking at his phone, and then looking out the window. He is also seen sitting in a chair, looking at his phone, and then looking out the window.", "gt-answer": "C. taking a seat on subway", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that a man wearing a blue shirt and black pants is sitting on a blue seat in a subway train. It also mentions that the man is seen sleeping on the bed while wearing a blue medical mask. From this, we can infer that the passengers are taking a seat on the subway.", "chatgpt-answer": "C. taking a seat on subway", "video-llm-prediction": "A man wearing a blue shirt and black pants is sitting on a blue seat in a subway train. He is wearing a blue medical mask and holding a red and white toy in his hand. The man is seen sleeping on the bed while wearing a blue medical mask.", "gt-answer": "C. taking a seat on subway", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the passengers are on a subway train. It also states that the man is seen sitting on a bench with his back turned to the camera, which indicates that he is taking a seat on the subway.", "chatgpt-answer": "C. taking a seat on subway", "video-llm-prediction": "A man wearing a blue shirt and black pants is seen sitting on a subway train, wearing a face mask. He is seen looking at his phone and then looking out the window. The train is filled with passengers who are also wearing face masks. The man is seen sitting on a bench with his back turned to the camera.", "gt-answer": "C. taking a seat on subway", "rating": 1 } ] }, "1012085909": { "action": [ { "chatgpt-reasoning": "The video description mentions that the group of people is riding bikes on a dirt road, pushing their bikes up a hill, and one person is seen riding a bike. None of the other choices are mentioned in the video description.", "chatgpt-answer": "C. pushing bikes up a hill", "video-llm-prediction": "The video shows a group of people riding bikes on a dirt road. They are seen pushing their bikes up a hill, and one person is seen riding a bike. The video also shows a person walking on the street.", "gt-answer": "C. pushing bikes up a hill", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the group of people is riding bikes on a dirt road and pushing their bikes up a hill.", "chatgpt-answer": "C. pushing bikes up a hill", "video-llm-prediction": "The video shows a group of people riding bikes on a dirt road. They are seen pushing their bikes up a hill, and the camera captures their movements as they continue to ride. The video also shows a man in a yellow shirt standing on the side of the road, and a woman in a blue shirt standing next to a bike. The video seems to be focused on the group of people riding bikes and their journey on the dirt road.", "gt-answer": "C. pushing bikes up a hill", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that a group of people are seen walking up a hill while pushing their bikes. This indicates that they are pushing bikes up a hill.", "chatgpt-answer": "C. pushing bikes up a hill", "video-llm-prediction": "A group of people are seen walking up a hill while pushing their bikes. They are wearing helmets and backpacks.", "gt-answer": "C. pushing bikes up a hill", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the people are seen walking on a dirt road and pushing their bikes up a hill. This implies that they are engaged in the activity of pushing bikes up a hill.", "chatgpt-answer": "C. pushing bikes up a hill", "video-llm-prediction": "A group of people are seen walking on a dirt road, pushing their bikes up a hill. They seem to be enjoying the scenery around them.", "gt-answer": "C. pushing bikes up a hill", "rating": 1 } ] }, "1079406734": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is washing his car in a parking lot. He is spraying the car with a hose, washing it with soap, rinsing it with water, drying it with a cloth, and cleaning the rims with a brush.", "chatgpt-answer": "C. washing the car", "video-llm-prediction": "A man is seen washing his car in a parking lot. He starts by spraying the car with a hose and then proceeds to wash the car with soap. After that, he rinses the car with water and then dries it with a cloth. Finally, he cleans the rims of the car with a brush.", "gt-answer": "C. washing the car", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is washing his car in a parking lot. The description provides details of the process, including spraying the car with a hose, washing it with soap, rinsing it with water, and using a blow dryer to dry it.", "chatgpt-answer": "C. washing the car", "video-llm-prediction": "A man is seen washing his car in a parking lot. He starts by spraying the car with a hose and then proceeds to wash the car with soap. He then rinses the car with water and uses a blow dryer to dry the car. The man is seen standing next to his car, and he is wearing a black shirt and black shoes. The video captures the man's attention to detail as he cleans his car thoroughly. The parking lot is surrounded by trees, and there are several cars parked in the background. Overall, the video showcases", "gt-answer": "C. washing the car", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is washing his car with a hose and soap, rinses it with water, and dries it with a cloth. This indicates that he is performing the task of cleaning or washing the car.", "chatgpt-answer": "C. washing the car", "video-llm-prediction": "A man is seen washing his car with a hose and soap. He then rinses the car with water and dries it with a cloth.", "gt-answer": "C. washing the car", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen washing his car in a parking lot. He sprays the car with a hose, cleans it with a sponge, rinses it with the hose, and dries it with a cloth.", "chatgpt-answer": "C. washing the car", "video-llm-prediction": "A man is seen washing his car in a parking lot. He sprays the car with a hose and then uses a sponge to clean the car. He then rinses the car with the hose and dries it with a cloth.", "gt-answer": "C. washing the car", "rating": 1 } ] }, "1022115337": { "order": [ { "chatgpt-reasoning": "The video description explicitly states that the girl is \"dancing and then sending an air kiss\". This implies that the dancing occurs before the air kiss.", "chatgpt-answer": "A. dancing and then sending an air kiss", "video-llm-prediction": "A young girl wearing a sparkly dress is seen dancing and then sending an air kiss.", "gt-answer": "A. dancing and then sending an air kiss", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the young girl is seen dancing and then sending an air kiss. This indicates that the events happen sequentially, with dancing happening before sending an air kiss.", "chatgpt-answer": "A. dancing and then sending an air kiss", "video-llm-prediction": "A young girl wearing a sparkly dress is seen dancing and then sending an air kiss.", "gt-answer": "A. dancing and then sending an air kiss", "rating": 1 }, { "chatgpt-reasoning": "The video description specifies that the young girl first dances and then sends an air kiss.", "chatgpt-answer": "A. dancing and then sending an air kiss", "video-llm-prediction": "A young girl wearing a sparkly dress dances and then sends an air kiss.", "gt-answer": "A. dancing and then sending an air kiss", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the young girl is seen dancing and then sending an air kiss.", "chatgpt-answer": "A. dancing and then sending an air kiss", "video-llm-prediction": "A young girl wearing a sparkly dress is seen dancing and then sending an air kiss.", "gt-answer": "A. dancing and then sending an air kiss", "rating": 1 } ] }, "1071214909": { "action": [ { "chatgpt-reasoning": "The video description states that the person is carving a design on the wooden surface, measuring the length of the surface, drawing a cutting line, and sanding the surface to make it smoother.", "chatgpt-answer": "A. carving a design", "video-llm-prediction": "A person is seen carving a design on a wooden surface. They measure the length of the surface and draw a cutting line. Then, they sand the surface to make it smoother.", "gt-answer": "C. drawing a cutting line", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is carving a design, measuring the length, drawing a cutting line, and sanding the surface. All of these actions are being performed on the wood surface.", "chatgpt-answer": "A. carving a design", "video-llm-prediction": "A person is seen carving a design on a wooden surface, measuring the length of the surface, drawing a cutting line, and sanding the surface.", "gt-answer": "C. drawing a cutting line", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the person is carving a design on the wooden surface using a tool, measuring the length of the surface, drawing a cutting line, and sanding the surface to make it smoother.", "chatgpt-answer": "A. carving a design", "video-llm-prediction": "A person is seen carving a design on a wooden surface using a tool. They then measure the length of the surface and draw a cutting line. After that, they sand the surface to make it smoother.", "gt-answer": "C. drawing a cutting line", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly states that the person is carving a design, measuring the length, drawing a cutting line, and sanding the surface of the wood.", "chatgpt-answer": "A. carving a design", "video-llm-prediction": "A person is seen carving a design on a wooden surface, measuring the length, drawing a cutting line, and sanding the surface.", "gt-answer": "C. drawing a cutting line", "rating": 0 } ] }, "1092065543": { "action": [ { "chatgpt-reasoning": "The video description clearly states that the man is shown shopping for vegetables in a store. He picks up boxes of cucumbers, tomatoes, and peppers and puts them in his bag.", "chatgpt-answer": "B. shopping", "video-llm-prediction": "A man is shown shopping for vegetables in a store. He picks up a box of cucumbers and a box of tomatoes, and then proceeds to put the cucumbers in his bag. He then picks up a box of peppers and puts them in his bag as well.", "gt-answer": "B. shopping", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the man is shopping for vegetables at a store.", "chatgpt-answer": "B. shopping", "video-llm-prediction": "A man is seen shopping for vegetables at a store. He picks up a box of cucumbers and a box of tomatoes and puts them in his bag.", "gt-answer": "B. shopping", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is shopping for vegetables and eating them.", "chatgpt-answer": "A. eating", "video-llm-prediction": "A man is seen shopping for vegetables and eating them.", "gt-answer": "B. shopping", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the man is shopping for vegetables at a store, picking up cucumbers and tomatoes and putting them in his bag.", "chatgpt-answer": "B. shopping", "video-llm-prediction": "A man is seen shopping for vegetables at a store. He picks up a box of cucumbers and a box of tomatoes, and then proceeds to put them in his bag.", "gt-answer": "B. shopping", "rating": 1 } ] }, "1017063703": { "action": [ { "chatgpt-reasoning": "The video description mentions that the person is seen decorating cakes with a piping bag, filling them with cream, and decorating them with chocolate shavings. The video also ends with the person presenting the cakes to guests.", "chatgpt-answer": "B. decorating cakes", "video-llm-prediction": "A person in blue gloves is seen decorating cakes with a piping bag. The person is seen filling the cakes with cream and then decorating them with chocolate shavings. The video ends with the person presenting the cakes to guests.", "gt-answer": "B. decorating cakes", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the person is seen decorating cakes in a kitchen using a piping bag. It also explicitly states that the video showcases the process of baking and decorating cakes. Therefore, the correct answer is B. decorating cakes.", "chatgpt-answer": "B. decorating cakes", "video-llm-prediction": "A person wearing blue gloves is seen decorating cakes in a kitchen. The person is seen using a piping bag to decorate the cakes. The video showcases the process of baking and decorating cakes in a kitchen. The person is seen using a piping bag to decorate the cakes, and the video provides a glimpse into the process of baking and decorating cakes. The video is a great resource for anyone interested in baking and decorating cakes.", "gt-answer": "B. decorating cakes", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the person is decorating cakes with a piping bag.", "chatgpt-answer": "B. decorating cakes", "video-llm-prediction": "A person wearing blue gloves is seen decorating cakes with a piping bag. The video showcases the process of baking and decorating cakes.", "gt-answer": "B. decorating cakes", "rating": 1 }, { "chatgpt-reasoning": "The video description specifically mentions that the person is decorating cakes with white frosting and black crumbs, cutting the cakes, and presenting them to guests.", "chatgpt-answer": "B. decorating cakes", "video-llm-prediction": "A person in blue gloves is seen decorating cakes with white frosting and black crumbs. The person is also seen cutting and presenting the cakes to guests.", "gt-answer": "B. decorating cakes", "rating": 1 } ] }, "1055022287": { "action": [ { "chatgpt-reasoning": "The video description explicitly states that the man is cleaning a swimming pool with a blue hose.", "chatgpt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "A man is seen cleaning a swimming pool with a blue hose while wearing a black shirt and blue jeans. He is also holding a blue hose in his hand.", "gt-answer": "C. cleaning a swimming pool", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly mentions that the man is cleaning a swimming pool with a blue hose. None of the other choices (cooking, singing) are mentioned or relevant to the video description.", "chatgpt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "A man is seen cleaning a swimming pool with a blue hose. He is wearing a black shirt and blue jeans. The man is seen cleaning the pool while standing on a wooden deck. The pool is surrounded by a white chair and a potted plant. The man is also seen cleaning the pool with a blue hose.", "gt-answer": "C. cleaning a swimming pool", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen cleaning a swimming pool. None of the other choices are mentioned in the description.", "chatgpt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "A man is seen cleaning a swimming pool with a blue hose. He is wearing a black shirt and blue jeans. The man is seen cleaning the pool while standing on a wooden deck.", "gt-answer": "C. cleaning a swimming pool", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the man is seen cleaning a swimming pool with a blue hose. The description also provides details about the man's attire and the environment in which he is cleaning.", "chatgpt-answer": "C. cleaning a swimming pool", "video-llm-prediction": "A man is seen cleaning a swimming pool with a blue hose. He is wearing a black shirt and blue jeans. The man is seen cleaning the pool while standing on a wooden deck. He is also seen cleaning the pool while standing on a wooden platform. The man is seen cleaning the pool while standing on a wooden deck.", "gt-answer": "C. cleaning a swimming pool", "rating": 1 } ] }, "1094259081": { "action": [ { "chatgpt-reasoning": "The video description mentions that the woman is wearing a VR headset and using it to watch a movie, listen to music, play a VR shooting game, and work out. Therefore, all of the choices are correct.", "chatgpt-answer": "A. watching VR movie, B. listening to music using VR, C. playing VR shooting game, D. working out using VR", "video-llm-prediction": "A woman is seen wearing a VR headset and using it to watch a movie, listen to music, play a VR shooting game, and work out.", "gt-answer": "C. playing VR shooting game", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is wearing a VR headset and playing a VR game. Additionally, it states that she is holding a remote control and moving her body while playing the game. These details suggest that she is actively engaged in gameplay rather than watching a movie or listening to music. The immersive experience mentioned also indicates that she is likely involved in some kind of interactive activity, such as playing a shooting game or working out using VR.", "chatgpt-answer": "C. playing VR shooting game", "video-llm-prediction": "A woman is seen wearing a VR headset and playing a VR game. She is seen holding a remote control and moving her body while playing the game. The video showcases the woman's immersive experience while playing the game.", "gt-answer": "C. playing VR shooting game", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the woman is wearing a VR headset and using it to watch a movie, listen to music, play a VR shooting game, and work out. Therefore, all the choices are correct.", "chatgpt-answer": "A. watching VR movie, B. listening to music using VR, C. playing VR shooting game, D. working out using VR", "video-llm-prediction": "A woman is seen wearing a VR headset and using it to watch a movie, listen to music, play a VR shooting game, and work out.", "gt-answer": "C. playing VR shooting game", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the woman is wearing a VR headset, holding a remote control, and moving her arms around as if she is holding a gun. This suggests that she is playing a video game, specifically a shooting game.", "chatgpt-answer": "C. playing VR shooting game", "video-llm-prediction": "A woman is seen sitting on a couch and wearing a VR headset. She is holding a remote control in her hand and appears to be playing a video game. The woman is fully immersed in the game and is seen moving her arms around as if she is holding a gun. The video captures the woman's intense concentration as she plays the game.", "gt-answer": "C. playing VR shooting game", "rating": 1 } ] }, "1022260408": { "action": [ { "chatgpt-reasoning": "The video description mentions that the squirrel is eating food while sitting on a rock, as well as running and sleeping in different locations.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "The video shows a squirrel eating food while sitting on a rock. The squirrel is seen running and sleeping in different locations.", "gt-answer": "C. eating food", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the squirrel is eating food in a tree.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A squirrel is seen eating food in a tree.", "gt-answer": "C. eating food", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the squirrel is seen \"eating food in the video\". Based on this information, we can conclude that the correct answer is C. eating food.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A squirrel is seen eating food in the video.", "gt-answer": "C. eating food", "rating": 1 }, { "chatgpt-reasoning": "The video description explicitly states that the squirrel is eating food.", "chatgpt-answer": "C. eating food", "video-llm-prediction": "A squirrel is seen eating food in the video.", "gt-answer": "C. eating food", "rating": 1 } ] }, "1089810969": { "action": [ { "chatgpt-reasoning": "The video description mentions that the little girl runs towards her mother and hugs her. This indicates that the little girl interacts by running towards her and hugging her.", "chatgpt-answer": "A. she runs towards her and hugs her", "video-llm-prediction": "In the video, a little girl is seen running towards her mother and hugging her. The mother then walks with the little girl and hugs her again. The video captures the heartwarming moment of a mother and daughter bonding.", "gt-answer": "A. she runs towards her and hugs her", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the little girl is seen running towards her mother and hugging her.", "chatgpt-answer": "A. she runs towards her and hugs her", "video-llm-prediction": "In the video, a little girl is seen running towards her mother and hugging her. The mother then walks with her daughter and hugs her again. The video captures the heartwarming moment between a mother and her daughter.", "gt-answer": "A. she runs towards her and hugs her", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the little girl runs towards her mother and hugs her tightly. This indicates that she interacts with the woman by running towards her and hugging her.", "chatgpt-answer": "A. she runs towards her and hugs her", "video-llm-prediction": "A little girl runs towards her mother and hugs her tightly. The mother then walks with her daughter and hugs her again. The little girl then runs towards her father and hugs him tightly. The father then walks with his daughter and hugs her again.", "gt-answer": "A. she runs towards her and hugs her", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the little girl runs towards her mother and hugs her tightly. Additionally, it mentions that the little girl runs towards her mother again and jumps on her back, showing her playful and affectionate nature. Therefore, the correct answer is C - she runs towards her and jumps on her back.", "chatgpt-answer": "C. she runs towards her and jumps on her back", "video-llm-prediction": "A little girl runs towards her mother and hugs her tightly, showing her love and affection. The mother, who is wearing a black shirt, is seen walking down a sidewalk with her daughter. The little girl then runs towards her again and jumps on her back, showing her playful and affectionate nature. The mother, who is wearing a white shirt, is seen walking down the sidewalk with her daughter again. The video captures the heartwarming moments of a mother and daughter spending quality time together.", "gt-answer": "A. she runs towards her and hugs her", "rating": 0 } ] }, "6165731": { "action": [ { "chatgpt-reasoning": "The video description states that the scientist is initially observing quietly on the experiment, then proceeds to leisurely conduct the experiments. However, it also mentions that he becomes frustrated and confused about the experiment.", "chatgpt-answer": "C. looking confused and frustrated about the experiment", "video-llm-prediction": "A scientist is shown observing quietly on an experiment. He then proceeds to leisurely conduct the experiments. However, he becomes frustrated and confused about the experiment.", "gt-answer": "C. looking confused and frustrated about the experiment", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the scientist is observing quietly on an experiment, and then proceeds to conduct the experiment leisurely. Additionally, it mentions that the scientist looks confused and frustrated about the outcome of the experiment.", "chatgpt-answer": "B. leisurely conducting experiments", "video-llm-prediction": "A scientist is seen observing quietly on an experiment. He then leisurely conducts the experiment, looking confused and frustrated about the outcome.", "gt-answer": "C. looking confused and frustrated about the experiment", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the scientist is observed quietly on the experiment and later leisurely conducts the experiment. It also mentions that he looks confused and frustrated about the outcome.", "chatgpt-answer": "C. looking confused and frustrated about the experiment", "video-llm-prediction": "A scientist is seen observing quietly on an experiment. He then leisurely conducts the experiment. However, he looks confused and frustrated about the outcome.", "gt-answer": "C. looking confused and frustrated about the experiment", "rating": 1 }, { "chatgpt-reasoning": "The video description clearly states that the scientist is \"observing quietly on an experiment.\" It also mentions that another scientist is \"leisurely conducting experiments\" and the third scientist is \"looking confused and frustrated about the experiment.\" Therefore, the correct answer is A. observing quietly on the experiment.", "chatgpt-answer": "A. observing quietly on the experiment", "video-llm-prediction": "A scientist is seen observing quietly on an experiment, while another scientist is leisurely conducting experiments. The third scientist is looking confused and frustrated about the experiment.", "gt-answer": "C. looking confused and frustrated about the experiment", "rating": 0 } ] }, "1111469465": { "action": [ { "chatgpt-reasoning": "The description mentions that the man is initially looking at his watch and then raises his arm to look at the watch, with his facial expression changing from happy to anxious. This indicates that he is likely feeling anxious or worried about something.", "chatgpt-answer": "C. raising his arm to look at the watch looking anxious", "video-llm-prediction": "The video shows a man wearing a blue shirt who is seen looking at his watch. He then raises his arm to look at the watch, and his facial expression changes from happy to anxious. The man then puts his hands in his pockets, and his facial expression changes from happy to anxious. The video does not provide any context or information about the man or his surroundings.", "gt-answer": "C. raising his arm to look at the watch looking anxious", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man raises his arm to look at his watch and appears to be happy. Later, he puts his hands in his pockets and looks anxious. Therefore, the correct answer is A. raising his arm to look at the watch looking happy.", "chatgpt-answer": "A. raising his arm to look at the watch looking happy", "video-llm-prediction": "The video shows a man wearing a blue shirt who is looking at his watch. He raises his arm to look at the watch and appears to be happy. The man then puts his hands in his pockets and looks anxious. The video does not provide any additional information.", "gt-answer": "C. raising his arm to look at the watch looking anxious", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the man is seen raising his arm to look at his watch, and he appears to be happy initially. Then, the video shows him raising his arm again, but this time he looks anxious. Finally, the video shows the man putting his hands in his pockets, and he looks anxious.", "chatgpt-answer": "D. putting his hands in his pockets looking anxious", "video-llm-prediction": "A man is seen raising his arm to look at his watch, and he appears to be happy. The video then shows the same man raising his arm again, but this time he looks anxious. The video then shows the man putting his hands in his pockets, and he looks anxious.", "gt-answer": "C. raising his arm to look at the watch looking anxious", "rating": 0 }, { "chatgpt-reasoning": "The video description specifically mentions that the man is raising his arm to look at the watch and appears to be happy.", "chatgpt-answer": "A. raising his arm to look at the watch looking happy", "video-llm-prediction": "A man is seen wearing a blue shirt and looking at his watch. He raises his arm to look at the watch and appears to be happy. The video captures the man's actions and emotions as he interacts with his watch.", "gt-answer": "C. raising his arm to look at the watch looking anxious", "rating": 0 } ] }, "1050000214": { "action": [ { "chatgpt-reasoning": "The video description mentions that the little child is running towards a pool, jumping into it, swimming, and playing in the water. Therefore, the correct answer is B. Swimming.", "chatgpt-answer": "B. Swimming", "video-llm-prediction": "A little child is seen running towards a pool and then jumping into it. The child then swims towards the edge of the pool and jumps again. The child continues to swim and play in the water.", "gt-answer": "C. Water jumping", "rating": 0 }, { "chatgpt-reasoning": "The video description mentions that the little child is running towards the pool, jumping into the water, swimming, and dancing in the water. Therefore, the correct answer should be an action that encompasses all these activities.", "chatgpt-answer": "B. Swimming", "video-llm-prediction": "The video shows a little child wearing a yellow swimsuit who is seen running towards the pool, jumping into the water, and swimming. The child is also seen dancing in the water.", "gt-answer": "C. Water jumping", "rating": 0 }, { "chatgpt-reasoning": "The video description states that the little child is running towards a pool, then jumping into the water and swimming. The description also mentions that the child is seen dancing in the water. Based on this information, it can be concluded that the little child is performing multiple actions including running, jumping into water, swimming, and dancing.", "chatgpt-answer": "None of the choices are correct", "video-llm-prediction": "A little child is seen running towards a pool, then jumping into the water and swimming. The child is also seen dancing in the water.", "gt-answer": "C. Water jumping", "rating": 0 }, { "chatgpt-reasoning": "The video description explicitly mentions that the little child is running, swimming, jumping in the water, and dancing in the pool.", "chatgpt-answer": "A. Running, B. Swimming, C. Water jumping, D. Dancing", "video-llm-prediction": "The video shows a little child having fun in a pool. The child is seen running, swimming, and jumping in the water. The child also dances in the pool, adding to the joyful atmosphere. The video captures the child's playful and carefree nature, as they enjoy themselves in the water.", "gt-answer": "C. Water jumping", "rating": 0 } ] }, "27537016": { "order": [ { "chatgpt-reasoning": "The video description states that the man is sitting in a car, talking to the camera, and then proceeds to show off his car key. The final action mentioned is that he pulls back inside the car. Therefore, the correct sequence of events involving the man is showing off his car key then pulling back inside the car.", "chatgpt-answer": "A. showing off his car key then pulling back inside the car", "video-llm-prediction": "A man is seen sitting in a car and talking to the camera. He then proceeds to show off his car key and pulls back inside the car.", "gt-answer": "A. showing off his car key then pulling back inside the car", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man is first seen showing off his car key and then pulling back inside the car. After that, he throws away his car key and pulls back inside the car again. So the correct sequence of events involving the man is \"A. showing off his car key then pulling back inside the car\".", "chatgpt-answer": "A. showing off his car key then pulling back inside the car", "video-llm-prediction": "A man is seen inside a car, showing off his car key and then pulling back inside the car. He then throws away his car key and pulls back inside the car.", "gt-answer": "A. showing off his car key then pulling back inside the car", "rating": 1 }, { "chatgpt-reasoning": "The video description mentions that the man is first showing off his car key and then pulling back inside the car.", "chatgpt-answer": "A. showing off his car key then pulling back inside the car", "video-llm-prediction": "A man is seen inside a car, showing off his car key and then pulling back inside the car.", "gt-answer": "A. showing off his car key then pulling back inside the car", "rating": 1 }, { "chatgpt-reasoning": "The video description states that the man first shows off his car key and then pulls back inside the car. After that, he throws away his car key. Therefore, the correct sequence of events is A. showing off his car key then pulling back inside the car.", "chatgpt-answer": "A. showing off his car key then pulling back inside the car.", "video-llm-prediction": "A man is seen inside a car, showing off his car key and then pulling back inside the car. He then throws away his car key and pulls back inside the car.", "gt-answer": "A. showing off his car key then pulling back inside the car", "rating": 1 } ] } }, "yes_no": { "1034419625": { "action": [ { "question": "Is the man dunking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is dunking the activity that the man is engaged in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man performing the action of dunking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does dunking best describe the man's action?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man dribbling a basketball?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is dribbling a basketball the activity that the man is engaged in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is passing a basketball the action that the man is performing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the man moving from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the camera's point of view, is the man moving from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In relation to the camera's position, is the man headed from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man moving from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In the camera's point of view, is the man moving from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In relation to the camera's position, is the man headed from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1094590221": { "action": [ { "question": "Is the man shooting basketball?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is shooting basketball the main action of the man in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in shooting basketball?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man dunking basketball?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is passing basketball depicted in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, the video shows a man passing a basketball to another person.", "match_success": true, "rating": 0 }, { "question": "Is dribbling basketball being performed by the man?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Does the position of the basketball moving leftwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the position of the basketball moving rightwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098982673": { "action": [ { "question": "Is the woman dancing and singing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can we observe that the woman is dancing and singing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the video, is the woman involved in dancing and singing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman eating and singing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman involved in cooking meal?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In the video, is the woman jumping?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the speed of the video normal?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing at 1x real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video appear to be at real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video playing at 2x real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the video appear to be at fluctuating speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video running at rapid pace?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1111657885": { "action": [ { "question": "Are the people ice skating?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is ice skating the sport the people are engaged in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can ice skating be observed in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes, the video shows a person skating on an ice rink.", "match_success": true, "rating": 1 }, { "question": "Are the people performing the action of ice skating?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the action being performed by the individuals ice skating?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people skiing?", "gt-answer": "no", "video-llm-prediction": "No, the people are not skiing. They are playing a game of curling on an ice rink.", "match_success": true, "rating": 1 }, { "question": "Is tennis the sport the people are engaged in?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Can dancing be observed in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, the video shows a person dancing on the ice.", "match_success": true, "rating": 0 }, { "question": "Are the people performing the action of playing basketball?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is running the action being performed by the individuals?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the tempo of the video in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the entire video presented in slow motion?", "gt-answer": "yes", "video-llm-prediction": "No, the video is not entirely in slow motion. The first part of the video shows the man skating in slow motion, but the rest of the video shows the man skating at regular speed.", "match_success": true, "rating": 0 }, { "question": "Is the video playing in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tempo of the video at a rapid pace?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the entire video presented in fast forward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video playing in real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Are the people skating towards the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction that the people moving towards the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the movement of the people towards the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the people skating parallel to the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the people moving away in relation to the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the movement of the people away from the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1073873933": { "action": [ { "question": "Is there fighting happening in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes, there is fighting happening in the video. Two monkeys are seen fighting each other in the video.", "match_success": true, "rating": 1 }, { "question": "Is the monkey engaged in the activity of fighting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the main action of the monkey involve fighting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the monkey depict the action of fighting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the monkey participating in the activity of fighting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is there eating happening in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, there is eating happening in the video. One of the monkeys is seen eating grass in the video.", "match_success": true, "rating": 0 }, { "question": "Is the monkey engaged in the activity of swimming?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Does the main action of the monkey involve reading?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Does the monkey depict the action of singing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the monkey participating in the activity of fishing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1089810425": { "action": [ { "question": "Are the people dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the people about dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people performing dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the people about participating in dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people engaged in dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes, the people in the video are dancing in the water.", "match_success": true, "rating": 1 }, { "question": "Are the people cooking?", "gt-answer": "no", "video-llm-prediction": "No, the people are not cooking. They are playing in the water.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the people about swimming?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the people performing reading?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the people about running?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the people participating in knitting?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the speed of the video normal?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video played at real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the rate of the video moderate speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the tempo of the entire video fast?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the rate of the video low speed?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Is the panning direction in the video right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera movement in the video panning from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video shifting horizontally?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera moving leftward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the panning direction in the video left to right?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera movement in the video zooming in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video shifting vertically?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera moving rightward?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1077507593": { "action": [ { "question": "Are the people cooking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is cooking the activity that can be seen in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the individuals performing the action of cooking?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can you observe the people cooking in the footage?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the action of the people best described by the verb 'cooking'?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the people sleeping?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is reading the activity that can be seen in the video?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Are the individuals performing the action of writing?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Can you observe the people playing sports in the footage?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Does the action of the people best described by the verb 'talking'?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the speed of the video slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the events happening in the video at a slow rate?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the tempo of the video slow?", "gt-answer": "yes", "video-llm-prediction": "No, the video is not slow. The chef is seen adding oil to the pan and stirring it around quickly.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the video normal speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the events happening in the video at a fast rate?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the tempo of the video rapid tempo?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Does the skillet smoke before burning in fire?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is smoking the first event to happen to the skillet before burning?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does smoking occur before burning in fire for the skillet?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the skillet burn in fire before smoking?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is smoking the second event to happen to the skillet after burning?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the skillet smoke after burning in fire?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1107116885": { "action": [ { "question": "Is the man shooting an arrow?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man participating in archery?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is shooting an arrow being performed by the man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man shooting an arrow with the bow?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man involved in shooting an arrow in the given footage?", "gt-answer": "yes", "video-llm-prediction": "Yes. The man is shown shooting an arrow in the video.", "match_success": true, "rating": 1 }, { "question": "Is the man swimming?", "gt-answer": "no", "video-llm-prediction": "No, the man is not swimming. He is practicing archery in a field.", "match_success": true, "rating": 1 }, { "question": "Is the man participating in soccer?", "gt-answer": "no", "video-llm-prediction": "No, the man is not participating in soccer. He is practicing his archery skills in a field.", "match_success": true, "rating": 1 }, { "question": "Is dancing being performed by the man?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the man throwing the bow away?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the man involved in cooking in the given footage?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the pace of the video normal speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed setting applied to the entire video normal speed?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "Is the video presented at real-time tempo?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video playing with time-lapse effect?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed setting applied to the entire video slow motion?", "gt-answer": "no", "video-llm-prediction": "No, the speed setting is applied only to the man's actions and not to the entire video.", "match_success": true, "rating": 1 }, { "question": "Is the tempo of the video speeded-up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059718130": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pace at which the video is playing fast-forward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video progress at a rate of time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pace at which the video is playing slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the video progress at a rate of slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the sun rising?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the sun about rising?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is rising the primary movement of the sun?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun setting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sun making a circular motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is descending the primary movement of the sun?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the video's brightness turning brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the brightness increasing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the brightness of the entire video intensifying?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video brightening?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video getting darker?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the attribute of brightness remaining stable?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the brightness of the video fading away?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the brightness of the video remaining constant?", "gt-answer": "no", "video-llm-prediction": "Yes, the brightness of the video remains constant throughout the video.", "match_success": true, "rating": 0 } ] }, "1083845854": { "speed": [ { "question": "Is the video playing at time-lapse speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the word time-lapse describe the speed of the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is this a time-lapse video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing at slow motion speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video playing at normal speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video playing at fast-forward speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Are the clock hands moving clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the clock hands moving counterclockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1050618460": { "speed": [ { "question": "Is the speed of the entire video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the entire video have a fast-paced pace?", "gt-answer": "yes", "video-llm-prediction": "No. The video has a slow-paced pace, with the camera focusing on the flowers and their details.", "match_success": true, "rating": 0 }, { "question": "Does the entire video appear rapidly in terms of tempo?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video play in real-time tempo?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the entire video have a slow-paced speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video being presented at its natural speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Are the flowers turning into full bloom?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the flowers transform from bud to full bloom?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the flowers withering?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Do the flowers transform from full bloom to bud?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1083113449": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does this video showcase a time-lapse effect?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the time-lapse effect evident in this video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is slow motion the type of speed applied to the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the playback speed of the video equivalent to real-time?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the sky getting darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "What is occurring to the sky? Is it getting darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the sky getting brighter?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the sky maintaining its brightness?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1091143117": { "speed": [ { "question": "Does the video play at its original speed?", "gt-answer": "yes", "video-llm-prediction": "No. The video is sped up to show the movement of the contact lens.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the video playback in sync with real-time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pace of the video in real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video time-lapse?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the video have fast-forward velocity?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the video fast-paced?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the eye changing from closed to open?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the eye changing from open to closed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100329207": { "action": [ { "question": "Is the sheep running?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sheep engaged in running?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Can the action of the sheep be seen as running?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the activity showcased in the video involving the sheep about running?", "gt-answer": "yes", "video-llm-prediction": "No. The video does not show any sheep running.", "match_success": true, "rating": 0 }, { "question": "Is the sheep sleeping?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the sheep engaged in eating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can the action of the sheep be seen as eating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the activity showcased in the video involving the sheep about fighting?", "gt-answer": "no", "video-llm-prediction": "No. The video does not show any fighting among the sheep.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Is the direction of the camera view moving forward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video panning in the forward direction?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera movement directed towards moving forward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the direction of the camera view moving backward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video panning downwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera movement tilting up?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the video 1x real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video running in real-time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video play at the speed it was originally captured?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video fast forward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the rate at which the video is playing accelerated?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the tempo of the video paused?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1089201973": { "action": [ { "question": "Are the people kicking football?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the people performing the action of kicking football?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the people participating in the sport of kicking football?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people spinning football?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the people performing the action of stopping football?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the people participating in the sport of throwing football?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the speed of the video slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pace at which the video is playing slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "At what rate is the video being played, slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the term slow motion describe the tempo of the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the word slow motion best describe the velocity of the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video being displayed at the actual speed it was recorded?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the pace at which the video is playing rapid speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "At what rate is the video being played, fast speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the term high speed describe the tempo of the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the word time-lapse best describe the velocity of the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the football moving from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the football moving from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1034736653": { "action": [ { "question": "Are the woman athletes running?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is running the primary action of the woman athletes?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the woman athletes engaged in running?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the woman athletes cycling?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is reading the primary action of the woman athletes?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is singing the activity the woman athletes are engaged in?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the woman closest to the camera moving at the fastest speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Compared to the other people in the video, is the woman closest to the camera moving faster?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Among the individuals in the video, is the woman closest to the camera moving at the highest speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Compared to the other people in the video, is the woman closest to the camera moving at the slowest speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Among the individuals in the video, is the woman in the background moving at the highest speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In terms of speed, does the woman closest to the camera rank as the slowest?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Are the woman athletes running from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the woman athletes running from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098153561": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing in fast forward?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Does the tempo of the video accelerated?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video playing at a real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the rate at which the video is being played slow-paced?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Are the leaves changing color from green to yellow?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the initial color of the leaves green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the final color of the leaves yellow and red?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the leaves changing color from yellow to green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the initial color of the leaves yellow?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the final color of the leaves green?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1084153195": { "action": [ { "question": "Are the dolphins swimming in the water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can swimming activity be observed in the dolphins?", "gt-answer": "yes", "video-llm-prediction": "Yes, the dolphins can be seen swimming in the water.", "match_success": true, "rating": 1 }, { "question": "Is swimming the action of the dolphins in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the dolphins diving in the water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can dancing activity be observed in the dolphins?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is climbing the main action of the dolphins in the video?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Are the dolphins swimming towards the shore?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "In which direction are the dolphins swimming? Towards the shore?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the dolphins hovering in one place in the entire video?", "gt-answer": "no", "video-llm-prediction": "No. The dolphins are seen swimming in the water and interacting with each other throughout the video.", "match_success": true, "rating": 1 }, { "question": "Are the dolphins swimming away from the shore?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the video running in real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video play at the speed it was initially filmed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video exhibit standard speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can the velocity of the video be described as slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the video exhibit fast-forward speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video accelerated?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Do the dolphins swim towards the shore, followed by getting fed with fish?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is getting fed with fish happens after swimming towards the shore for the dolphins?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the dolphins swim towards the shore and then get fed with fish?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the dolphins get fed with fish before swimming towards the shore?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is getting fed with fish happens before swimming towards the shore for the dolphins?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Do the dolphins get fed with fish and then swim towards the shore?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1054717541": { "action": [ { "question": "Is the person kneading dough?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the action of the person about kneading dough?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the action demonstrated by the person about kneading dough?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person grilling dough?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the action of the person about cutting dough?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the action demonstrated by the person about throwing dough?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the video playing in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video have a tempo of slow playback?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the relative speed of the video slower compared to real-time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing at real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the tempo of the video playback fast?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the relative speed of the video faster compared to real-time?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1081092839": { "direction": [ { "question": "Is the direction of the sun descending?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the movement pattern of the sun falling?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the sun travel downwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the sun ascending?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the movement pattern of the sun rising?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the sun travel upwards during sunrise", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tempo of the video fast pace?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the video playing at time-lapse speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes, the video is in slow motion.", "match_success": true, "rating": 0 }, { "question": "Is the tempo of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video being presented at its natural speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059462749": { "action": [ { "question": "Is the person climbing down a ladder?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is climbing down a ladder the action being performed by the person?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is climbing down a ladder the main action of the person in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person reading a book?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is painting a picture the activity taking place with the person?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is playing basketball the main action of the person in the video?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Is the person moving downwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the word 'descending' describe the movement of the person?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person descending from a higher point to a lower point?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person moving upwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the word 'rising' describe the movement of the person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person ascending towards a higher point from a lower point?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the video playing at a regular speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video play at the speed it was originally captured?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video play in real-time tempo?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video playing in time-lapse?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video being played in an accelerated pace?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video running in high speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1077590324": { "action": [ { "question": "Is the woman doing laundry?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in the activity of doing laundry?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman performing the action of doing laundry?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman involved in the task of doing laundry?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman cooking?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not cooking. She is washing clothes in the sink.", "match_success": true, "rating": 1 }, { "question": "Is the woman dancing?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not dancing. She is washing clothes in the sink.", "match_success": true, "rating": 1 }, { "question": "Is the woman swimming?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not swimming. She is seen kneeling down in front of a washing machine and wiping it down.", "match_success": true, "rating": 1 }, { "question": "Is the woman knitting?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not knitting. She is washing clothes in the sink.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Does the video play at the speed it was initially filmed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the playback speed of the video equivalent to real-time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video being played in regular speed?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "Is the speed of the entire video slow motion?", "gt-answer": "no", "video-llm-prediction": "No, the video is not in slow motion. The woman is seen washing clothes in a sink, and the video is played at regular speed.", "match_success": true, "rating": 1 }, { "question": "Is the velocity of the video playback low speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video being played in rapid motion?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Is the woman putting clothes into the washing machine and then standing up to operate it?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is putting clothes into the washing machine and then turning it on the sequence of actions taken by the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman closing the door of the washing machine and then standing in front of it?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman sitting down to operate the washing machine and then putting clothes into it?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is turning off the washing machine and then getting dressed the sequence of actions taken by the woman?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the woman opening the door of the washing machine and then standing in front of it?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1040541401": { "action": [ { "question": "Are the children doing chemical experiments?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the children engaged in activities related to chemical experiments?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the main action performed by the children about doing chemical experiments?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the children participating in an activity that involves doing chemical experiments?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the children painting pictures?", "gt-answer": "no", "video-llm-prediction": "No, the children are not painting pictures. They are making a science experiment.", "match_success": true, "rating": 1 }, { "question": "Are the children engaged in activities related to reading books?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the main action performed by the children about playing soccer?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the speed of the video 1x real-time?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video play in real-time tempo?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video running at a real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video playing in time-lapse?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video playing very slow?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the video running at a rapid speed?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1059072773": { "attribute_change": [ { "question": "Is the ice cream melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice cream turning into liquid?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice cream freezing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the ice cream evaporating?", "gt-answer": "no", "video-llm-prediction": "Yes, the ice cream is evaporating.", "match_success": true, "rating": 0 } ] }, "1064645467": { "action": [ { "question": "Is the man exercising?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in doing exercise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man participating in exercising?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man cooking?", "gt-answer": "no", "video-llm-prediction": "No, the man is not cooking. He is seen standing in front of a pole and adjusting his tie.", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in reading a book?", "gt-answer": "no", "video-llm-prediction": "No, the man is not reading a book. He is adjusting his tie and looking at his phone.", "match_success": true, "rating": 1 }, { "question": "Is the man participating in watching TV?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the video being presented at its natural speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video playing at a normal speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video being displayed at the actual speed it was recorded?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video playing at a fast speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video playback rate accelerated speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Does the man take off his jacket before jumping up to grab the bar?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the man jump up to grab the bar after taking off his jacket?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the man take off his jacket and then jump up to grab the bar with his hands?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the man jump up to grab the bar before taking off his jacket?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the man jump up to grab the bar while taking off his jacket?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the man jump up to grab the bar and then take off his jacket?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1088279109": { "direction": [ { "question": "Is the elevator rising?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the elevator moving up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is ascending the direction of the elevator's movement?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the elevator going down?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is descending the direction of the elevator's movement?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the elevator stopped?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the speed of the video normal?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video being played in normal speed mode?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video play at the speed it was initially filmed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video being played in fast forward mode?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the video play at the speed of slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093573255": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video running at a rapid pace?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "Is the video being played at timelapse speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video normal speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video running sluggishly?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the video played at decelerated motion speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the plant reviving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the condition of the plant about reviving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the plant changing in a way that it is reviving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In what way is the plant transforming, is it reviving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the plant wilting?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the condition of the plant about withering?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the plant changing in a way that it is fading?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In what way is the plant transforming, is it deteriorating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1105233293": { "action": [ { "question": "Are the people playing basketball?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the people engaged in playing basketball?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is playing basketball the sport the people are participating in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the people swimming?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the people engaged in dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is football the sport the people are participating in?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the tempo of the video playback real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does real-time speed best characterize the speed of the entire video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the rate at which the video is progressing real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the tempo of the video playback freeze frame?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does decelerated motion best characterize the speed of the entire video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the rate at which the video is progressing slo-mo?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Are the players passing the ball to each other and then shooting the basketball?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is passing the ball to each other and shooting the basketball the correct order of events?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the sequence of events involve passing the ball to each other and then shooting the basketball?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the players shooting the basketball and then passing the ball to each other?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is shooting the basketball and blocking the opponent the sequence of actions performed by the players?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the correct order of events involve dribbling, shooting, passing the basketball?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1077146132": { "action": [ { "question": "Is the woman waking up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the action depicted in the video waking up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman falling asleep?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the woman tossing and turning in the bed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Does the sequence of events start with getting out of bed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does opening the curtains occur after getting out of bed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is opening the curtains the last event to occur?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Does the sequence of events start with closing the curtains?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does opening the curtains occur before getting into bed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the sequence of events end with getting out of bed, instead of opening the curtains?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "attribute_change": [ { "question": "Is the video turning brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video increasing in terms of brightness?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the light condition getting brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video turning darker?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video decreasing in terms of brightness?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the light condition getting dimmer?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086688682": { "attribute_change": [ { "question": "Are the traffic lights changing from red to green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the alteration taking place to the traffic lights transitioning from red to green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the traffic lights changing from yellow to red?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the alteration taking place to the traffic lights transitioning from green to red?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096612823": { "action": [ { "question": "Is the car driving on the road?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "What can be observed about the car's movement? Is it driving on the road?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In the scene, is the car driving on the road?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the car sliding on ice?", "gt-answer": "no", "video-llm-prediction": "No, the car is not sliding on ice. The video shows a car driving on a curvy road surrounded by trees.", "match_success": true, "rating": 1 }, { "question": "Is the car parked?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the car buried in the sand?", "gt-answer": "no", "video-llm-prediction": "No, the car is not buried in the sand. The video shows a car driving down a winding road surrounded by trees.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Is the video zooming in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is direction of movement zooming in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video changing by zooming in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video zooming out?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video rotating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video panning left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1075484900": { "direction": [ { "question": "Is the child turning away from the man?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the child turning towards the man?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1090578917": { "action": [ { "question": "Is the man playing soccer?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in playing soccer?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man participating in the sport of soccer?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man painting a picture?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the man dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the man participating in volleyball?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the man leaping to his right and then standing up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man standing up from the ground after leaping?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man leaping to his right before standing up in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man standing up and then leaping to his right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man standing up from the ground before leaping?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man leaping to his right after standing up in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the man leaping to his right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man moving towards the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man leaping to his left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man moving forwards?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1075338140": { "direction": [ { "question": "Is the ball rolling from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the ball moving in the direction of rolling from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the ball travel in the direction of rolling from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the ball spinning in place?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the ball moving counterclockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the ball rolling from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1067268403": { "direction": [ { "question": "Are the wind turbines rotating clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the wind turbines rotating counterclockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1072594556": { "speed": [ { "question": "Is the car in the center of the screen faster than other cars?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the car in the center of the screen move faster compared to other cars?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the car in the center of the screen slower than other cars?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the car in the center of the screen move slower compared to other cars?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1096007487": { "direction": [ { "question": "Is the 3d cloud spinning leftward from the camera's point of view?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the 3d cloud spinning leftward as seen from the camera's perspective?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the 3D cloud appear to be rotating leftward from the viewpoint of the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the 3d cloud spinning rightward from the camera's point of view?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the 3d cloud spinning upward from the camera's point of view?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the 3d cloud spinning downward from the camera's point of view?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1095939659": { "direction": [ { "question": "Is the light growing in a clockwise direction?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the direction of the light's movement anticlockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059632327": { "direction": [ { "question": "Is the direction of the tennis ball bouncing up and down?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the tennis ball bouncing left and right?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098785169": { "direction": [ { "question": "Is the direction of the galaxy's spin clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the galaxy's spin counterclockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099984801": { "direction": [ { "question": "Are the clouds moving towards the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the clouds moving away from the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video set to time-lapse speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video have an accelerating pacing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video set to real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the video have a decelerating pacing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the entire video getting darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the entire video turning brighter?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1082419672": { "direction": [ { "question": "Is the direction of movement in the video flying backwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the entire video moving backwards relative to the ship?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of movement in the video flying forwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the entire video moving forwards relative to the ship?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1058985719": { "direction": [ { "question": "Is the airplane flying from bottom to top?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the airplane moving upwards on the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the airplane flying from top to bottom?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the airplane moving downwards on the screen?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055413730": { "direction": [ { "question": "Is the planet Earth spinning rightwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "According to the camera's perspective, is the rotational movement of the planet Earth spinning to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Based on the camera's viewpoint, is the apparent motion of the Earth spinning to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the planet Earth spinning leftwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "According to the camera's perspective, is the rotational movement of the planet Earth rotating upward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Based on the camera's viewpoint, is the apparent motion of the Earth a complete stop?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1081684532": { "direction": [ { "question": "Are the asteroids flying towards the camera?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Are the asteroids flying away from the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "23391142": { "action": [ { "question": "Are the people playing badminton?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is playing badminton happening in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the people playing tennis?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the video panning to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the movement of the video about panning to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the scene shifting to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video panning to the left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the movement of the video about zooming in?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the scene shifting to the bottom?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the video playing in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video playing at real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1078368947": { "action": [ { "question": "Is the woman reading a book in the bathroom?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in reading a book?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is reading a book while taking a bath describes the woman's action?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman washing her hair while taking a bath?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is taking a shower describes the woman's activity?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is washing her face while taking a bath describes the woman's action?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1099738787": { "attribute_change": [ { "question": "Is the concrete wall falling apart?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the concrete wall changing by falling apart?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the concrete wall growing taller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the concrete wall assembling together?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1094219575": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video use time-lapse speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video play in real-time tempo?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the video use slow motion speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Are the flowers wilting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the condition of the flowers decaying?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the transformation occurring to the flowers fading away?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the flowers growing taller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the flowers blooming", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the transformation occurring to the flowers sprouting new buds?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1053758117": { "direction": [ { "question": "Is the camera zooming into a 3D digital brain?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving in the video by zooming in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera standing still before a 3D digital brain?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera zooming out in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1069717165": { "order": [ { "question": "Does the woman nod her head after shaking it?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the woman nod her head and then shake it?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1041584314": { "order": [ { "question": "Does the man show a serious expression and then smile?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "After showing a serious expression, does the man start to smile?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the man's facial expressions change from serious to smiling over time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the man show a serious expression after smiling?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Before showing a serious expression, does the man start to smile?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the man's facial expressions change from smiling to serious over time?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067427023": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing in time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video progressing by being sped up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the playback speed of the video equivalent to real-time?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video playing in slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video progressing in real-time?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Are the snow particles melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the primary attribute change experienced by the snow particles melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the snow particles solidifying?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is scattering the primary attribute change experienced by the snow particles?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1093948229": { "attribute_change": [ { "question": "Are the golden particles exploding?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the change in the attribute of the golden particles involve exploding?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the transformation taking place on the golden particles represented by exploding?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the golden particles disappearing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is shrinking the best word that represents the change in the attribute of the golden particles?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is contracting the best word that represents the transformation taking place on the golden particles?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1106668103": { "direction": [ { "question": "Is the direction of movement in the video moving forward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the primary motion depicted in the video about moving forward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the primary trajectory in the video involve moving forward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of movement in the video moving backward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the primary motion depicted in the video about moving leftward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the primary trajectory in the video involve moving right ward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1049965795": { "attribute_change": [ { "question": "Is the light bulb lighting up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "What is happening to the light bulb? Is it lighting up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is lighting up the alteration that takes place in the light bulb?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the light bulb turning off?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "What change occurs in the light bulb? Is it getting darker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is turning off the alteration that takes place in the light bulb?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1052364490": { "attribute_change": [ { "question": "Is the digital bar chart growing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the digital bar chart decreasing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1080990179": { "attribute_change": [ { "question": "Is the apple shrinking and drying out?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the apple getting smaller?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is shrinking and drying out the change in the apple's attributes?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the apple ripening?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the apple becoming juicier?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is getting bigger and softer the change in the apple's attributes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1057163434": { "direction": [ { "question": "Is the chef putting the bread on top of the burger?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the chef removing the bread from the burger?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1085910917": { "action": [ { "question": "Is the woman drinking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the woman about drinking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is drinking the action performed by the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman sleeping?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not sleeping. She is drinking water from a glass.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the woman about running?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is reading the action performed by the woman?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "order": [ { "question": "Does the video show the events occurring in the sequence of drinking a glass of water and then turning back?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video show the events occurring in the sequence of turning back and then drinking a glass of water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1058907236": { "action": [ { "question": "Is the squirrel foraging?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the squirrel performing the action of foraging for nuts?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the squirrel sleeping?", "gt-answer": "no", "video-llm-prediction": "No, the squirrel is not sleeping. It is eating nuts and looking around.", "match_success": true, "rating": 1 }, { "question": "Is building a nest the main activity of the squirrel?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Does the sequence of events involve the squirrel first picking up a nut and then turning back?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the sequence of events involve the squirrel first turning back and then picking up a nut?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1077575504": { "attribute_change": [ { "question": "Is the pile of salt growing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the attribute change happening to the pile of salt about growing?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the pile of salt changing by growing bigger?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt shrinking?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the attribute change happening to the pile of salt about getting smaller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pile of salt changing by vanishing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "23370985": { "attribute_change": [ { "question": "Is the ice crystal freezing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the process occurring with the ice crystal forming?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the transformation taking place in the ice crystal forming?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice crystal melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the process occurring with the ice crystal reducing in size?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the transformation taking place in the ice crystal melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100319395": { "direction": [ { "question": "Is the circular pattern moving clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the circular pattern spinning clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the circular pattern spinning in the clockwise direction?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the circular pattern moving counter-clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the circular pattern spinning counter-clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the circular pattern spinning in the anticlockwise direction?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067268406": { "speed": [ { "question": "Is the car faster than the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the car's speed faster than camera's speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the car move at a faster speed compared to the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the car slower than the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the car's speed slower than camera's speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the car move at a slower speed compared to the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1092682551": { "speed": [ { "question": "Do the cars travel slower than the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the cars slower than the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it true that the cars move at a slower speed compared to the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the cars travel at the same speed as the camera?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the cars faster than the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does it mean that the cars move faster compared to the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1101200293": { "direction": [ { "question": "Is the camera motion relative to the aircraft carrier clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera motion relative to the aircraft carrier counterclockwise?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1072453637": { "direction": [ { "question": "Is the camera panning to the back of a fighter jet?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera panning to the front around a fighter jet?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Did the fighter jet shoot one missile first and then shoot two missiles?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Did the fighter jet shoot two missiles after shooting one missile?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Did the fighter jet shoot three missiles first and then shoot four missiles?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Did the fighter jet shoot one missile after shooting two missiles?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3396473605": { "direction": [ { "question": "Do the five stars appear from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the five stars disappear from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086820415": { "direction": [ { "question": "Is the large wave moving vertically towards the bottom of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the large wave move in the direction towards the bottom of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is moving vertically towards the bottom the direction of motion of the large wave?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the large wave moving horizontally towards the right side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the large wave move in the direction towards the top of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is moving vertically towards the top the direction of motion of the large wave?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1081513610": { "action": [ { "question": "Is the man discussing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man performing the action of discussing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is discussing the primary activity of the man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man swimming?", "gt-answer": "no", "video-llm-prediction": "No, the man is not swimming. He is sitting at a table with a laptop and writing on a piece of paper.", "match_success": true, "rating": 1 }, { "question": "Is the man performing the action of reading?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is cooking the primary activity of the man?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1073831006": { "action": [ { "question": "Are the zebras running?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the zebras performing the action of running?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can we see the zebras running in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes, we can see the zebras running in the video.", "match_success": true, "rating": 1 }, { "question": "Are the zebras sleeping?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the zebras performing the action of walking?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Can we see the zebras eating in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, the video shows the zebras eating in the field.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Are the zebras moving from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the zebras moving from left to right relative to the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the zebras heading rightward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the zebras moving from right to left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the zebras moving away from the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the zebras heading downward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Are the zebras moving in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video show the zebras at a slowe-motion speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the zebras stationary?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the video playing at real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the video play in fast motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1069338034": { "action": [ { "question": "Are the elephants eating and drinking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is eating and drinking observed in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes, the video shows the elephants eating and drinking in the river.", "match_success": true, "rating": 1 }, { "question": "Are the elephants engaged in eating and drinking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the elephants swimming and drinking?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is swimming and taking bath observed in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, the video shows the elephants swimming and taking bath in the river.", "match_success": true, "rating": 0 }, { "question": "Are the elephants engaged in swimming and cleaning themselves?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1076880707": { "action": [ { "question": "Is the bear scratching against a tree?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the bear engaged in the activity of scratching against a tree?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is scratching against a tree the action seen in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the bear eating honey?", "gt-answer": "no", "video-llm-prediction": "No, the bear is not eating honey. It is seen rubbing its head against a tree and scratching its back against the tree.", "match_success": true, "rating": 1 }, { "question": "Is the bear engaged in the activity of climbing a tree?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is sleeping against the tree the action seen in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1092278063": { "direction": [ { "question": "Are the two rows of duck toy moving in opposite directions on a conveyor belt?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the two rows of duck toy moving relative to each other opposite on a conveyor belt?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the two rows of duck toy moving in the same direction on a conveyor belt?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the direction of the two rows of duck toy moving relative to each other in the same direction?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is this video played at a real-time speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is this video played at a extreme slow-motion speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1024867412": { "action": [ { "question": "Is the dog driving a car?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the dog engaged in driving a car?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is driving a car the action the dog is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the dog eating?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the dog engaged in reading a book?", "gt-answer": "no", "video-llm-prediction": "No, the dog is not engaged in reading a book. The video shows the dog sitting in the car and looking out the window.", "match_success": true, "rating": 1 }, { "question": "Is the dog performing the action of painting?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Is the car taking a right turn?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the car moving in the right direction?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is making a right turn the maneuver the car is making?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the car driving straight in the entire video?", "gt-answer": "no", "video-llm-prediction": "Yes, the car is driving straight in the entire video.", "match_success": true, "rating": 0 }, { "question": "Is the car moving to the left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is making a left turn the maneuver the car is making?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1076877854": { "action": [ { "question": "Are the robots caring for seedlings?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the robots performing the task of caring for seedlings?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the robots engaged in the action of caring for seedlings?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the robots watering plants?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the robots performing the task of building houses?", "gt-answer": "no", "video-llm-prediction": "No, the robots are not building houses. They are performing the task of planting seeds in the soil.", "match_success": true, "rating": 1 }, { "question": "Are the robots engaged in the action of playing chess?", "gt-answer": "no", "video-llm-prediction": "No, the robots are not engaged in playing chess. They are simply watering the plants in the field.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Is the closest robotic arm moving to the right side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can the closest robotic arm be observed moving to the right side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the closest robotic arm exhibit movement to the right side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the closest robotic arm moving towards the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can the closest robotic arm be observed moving to the left side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the closest robotic arm sway back and forth?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1104673225": { "action": [ { "question": "Is the woman eating salad?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in eating salad?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is eating salad the action the woman is involved in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman wrapping up salad?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the woman involved in drinking vegetable juice?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is making salad the action the woman is involved in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100468035": { "direction": [ { "question": "Is the camera zooming forward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving towards zooming forward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the camera show zooming forward movement?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera zooming backward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera tracking right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the camera panning left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the door gradually opening?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the door changing by gradually opening?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the change of the door best described as opening?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the door remaining closed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the door changing by gradually closing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the door gradually closing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "315784": { "speed": [ { "question": "Is the speedometer in the center moving faster than the one on the left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the relative speed of the speedometer in the center faster compared to the speedometer on the left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speedometer in the center move at a faster speed compared to the one on the left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speedometer in the center stationary?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the relative speed of the speedometer in the center slower compared to the speedometer on the left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the speedometer in the center move at a slower speed compared to the one on the left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3411806181": { "action": [ { "question": "Is the person recharging an electric vehicle?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person engaged in the activity of recharging an EV?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is recharging an electric vehicle one of the actions that the person is involved in?", "gt-answer": "yes", "video-llm-prediction": "Yes. The person is seen recharging an electric vehicle with a portable charger.", "match_success": true, "rating": 1 }, { "question": "Is the person cleaning an electric vehicle?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the person repairing an electric vehicle?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is driving an electric vehicle the action that the person is involved in?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the person moving the charging gun towards the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person performing the action of plugging the charging gun into the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving the charging gun towards the side of the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving the charging gun away from the car?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person unplugging the charging gun from the car?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person moving the charging gun towards himself?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the video playing in slow motion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video playing in time-lapse?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1043054206": { "speed": [ { "question": "Is the yellow car driving faster than other cars?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can you describe the speed of the yellow car as faster compared to other cars?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the yellow car moving faster than other cars?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the yellow car stopped?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the yellow car driving at the same speed as other cars?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the yellow car driving slower than other cars?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1096238125": { "action": [ { "question": "Are the man and woman lifting weights?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the man and woman about lifting kettlebell?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the man and woman engaged in lifting kettlebell?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the man and woman doing sit-ups?", "gt-answer": "no", "video-llm-prediction": "No, the man and woman are not doing sit-ups. They are performing a weightlifting exercise.", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the man and woman about jumping ropes?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the man and woman engaged in doing push-ups?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Is the man lifting the kettlebell at roughly the same speed as the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In terms of speed, does the man compare to the woman while lifting the kettlebell approximately the same?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the man relative to the woman while lifting the kettlebell same?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man lifting the kettlebell at a much slower pace than the woman?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In terms of speed, is the man significantly faster than the woman while lifting the kettlebell?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the man lift the kettlebell much slower than the woman?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1103088481": { "action": [ { "question": "Is the person buying vegetables in the market?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person engaged in the activity of buying vegetables at the grocery store?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is buying vegetables what the individual is doing in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person selling vegetables in the market?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the person cooking vegetables at the grocery store?", "gt-answer": "no", "video-llm-prediction": "No, the person is not cooking vegetables at the grocery store. The video shows the person pushing a shopping cart down an aisle and looking at the produce section.", "match_success": true, "rating": 1 }, { "question": "Is eating vegetables what the individual is doing in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the correct order of events in the video placing a green vegetable into the trolley and then placing a black vegetable into the trolley?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person picking up a green vegetable before picking up a black vegetable?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the correct order of events in the video placing a black vegetable into the trolley and then placing a green vegetable into the trolley?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person picking up a green vegetable after picking up a black vegetable?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055981522": { "attribute_change": [ { "question": "Are the 3d shapes turning into spheres?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3d shapes changing from cubes into spheres?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3d shapes turning into cubes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the 3d shapes changing from sphere into cubes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1061017846": { "speed": [ { "question": "Is the boat on the top of the screen traveling at the same speed as the boat on the bottom of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the two boats in the video travel at the same speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the boat on the top of the screen significantly slower than the boat on the bottom of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the two boats in the video travel at significantly different speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1097341567": { "order": [ { "question": "Do the bars appear before the arrow in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the arrow appear after the bars in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the bars and the arrow appear at the same time in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the arrow appear before the bars in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1056433484": { "direction": [ { "question": "Is the direction of the Earth's motion around the Sun counter-clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the Earth travel in a counter-clockwise direction in its orbit around the Sun?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the Earth's rotation in relation to the Sun follow a counter-clockwise direction?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the Earth's motion around the Sun clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the Earth travel in a clockwise direction in its orbit around the Sun?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the Earth's rotation in relation to the Sun follow a anti-clockwise direction?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Does the earth rotate faster than the sun?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the earth's speed compared to the sun faster?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the earth rotate faster than the sun in terms of speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the earth rotate slower than the sun?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the earth's speed compared to the sun slower?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the sun rotate faster than the earth in terms of speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1073914229": { "direction": [ { "question": "Do the trains travel towards each other?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the trains travel away from each other?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099360359": { "speed": [ { "question": "Does the train further away from the screen drive faster?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the relative speed between the two trains about the train further away from the screen driving faster?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "According to the video, does the train further away from the screen have a higher speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the train closer to the screen drive faster?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the relative speed between the two trains about the train closer to the screen driving faster?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "According to the video, does the train closer to the screen have a higher speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098970151": { "action": [ { "question": "Is the cat licking its paw?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video focused on a cat licking its paws?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the cat licking its paws with its tongue?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the cat waving its paw?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video focused on a cat watching its paw?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the cat licking another cat?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1081734740": { "attribute_change": [ { "question": "Is the texture of the leaf turning from green to yellow?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the leaf turning into yellow color?", "gt-answer": "yes", "video-llm-prediction": "Yes, the leaf is turning into yellow color.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring in the leaf that it is becoming yellow?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the texture of the leaf turning from yellow to green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the leaf turning into green color?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring in the leaf that it is getting greener?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1093719871": { "attribute_change": [ { "question": "Are the pink flowers turning from withered to full blossom?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the pink flowers become fully bloomed in the end?", "gt-answer": "yes", "video-llm-prediction": "Yes, the pink flowers become fully bloomed in the end.", "match_success": true, "rating": 1 }, { "question": "Are the pink flowers falling off petals?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the pink flowers turning from full blossom to withered?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1042819039": { "speed": [ { "question": "Is the speed of the video time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pace at which the video is playing about time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video being shown in time-lapse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the video slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pace at which the video is playing about real-time speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video being shown in slow motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Did the street get filled with people before getting filled with vehicles?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the events occur in the order of the street getting filled with people, then vehicles?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the street get filled with vehicles before getting filled with people?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Did the events occur in the order of the street getting filled with vehicles, then people?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093139559": { "direction": [ { "question": "Is the camera moving in the direction of zooming in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does zooming forward best describe the camera's motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving in the direction of zooming out?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is tilting upwards the best description of the camera's motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Are the light conditions on the football players turning brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is it accurate to say that the football players are becoming more visible?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the light conditions on the football players staying the same?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is it accurate to say that the football players are becoming dimmer?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055973887": { "attribute_change": [ { "question": "Is the fire ball getting larger?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the fire ball changing its size and shape?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is growing in size the way the fire ball is transforming?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the fire ball staying the same size?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is getting smaller the way the fire ball is transforming?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is shrinking in size the way the fire ball is transforming?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1098710341": { "action": [ { "question": "Is the person pouring water into a glass?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person performing the action of pouring water into a glass?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is pouring water into a glass the action being performed by the person?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person drinking water from a glass?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person stirring water in a bowl?", "gt-answer": "no", "video-llm-prediction": "No, the person is not stirring water in a bowl. The video shows a person pouring water into a glass and stirring it with a spoon.", "match_success": true, "rating": 1 }, { "question": "Is washing hands with water the action being performed by the person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the glass going from empty to full of water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is there water in the glass in the final of video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the glass going from full of water to empty?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the final state of the glass empty?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1062736174": { "action": [ { "question": "Is the chef sprinkling salt on the steak?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the chef performing the action of sprinkling salt on the steak?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the chef chopping steak?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the chef pouring water on the steak?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099116143": { "attribute_change": [ { "question": "Is white foam appearing on the surface of the pink liquid?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can the visual observation of the pink liquid include white foam appearing on the surface?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is white foam disappearing from the surface of the pink liquid?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the pink liquid become green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1108398787": { "action": [ { "question": "Is this video about operating system settings on a smartphone device?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is operating system settings the activity the video is presenting?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is this video about chatting on a smartphone device?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is watching videos on a smartphone device the activity the video is presenting? ", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the person scrolling down and then entering passwords?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the events occurring in the order of scrolling down and then entering passwords?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person performing the actions by scrolling down and then entering passwords?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person entering passwords and then scrolling down?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the events occurring in the order of entering passwords and then scrolling up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person performing the actions by scrolling up and then entering passwords?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1080591311": { "direction": [ { "question": "Is the jellyfish floating upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of motion for the jellyfish upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is going up the way the jellyfish is moving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the jellyfish moving towards the right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is floating to the left the direction of motion for the jellyfish?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is going down the way the jellyfish is moving?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1107034223": { "action": [ { "question": "Is the bear catching fishes in the river?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the bear engaged in fishing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is catching fishes the main action of the bear?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the bear swimming in the river?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the bear drinking?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is climbing rocks the main action of the bear?", "gt-answer": "no", "video-llm-prediction": "No. The main action of the bear is catching and eating a fish in the water.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Is the bear catching a fish and then turning back?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the bear turning back and then catching a fish?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1025623079": { "attribute_change": [ { "question": "Is the skyscraper collapsing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring with the skyscraper about collapsing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the skyscraper growing taller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring with the skyscraper being eracted?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1094782389": { "action": [ { "question": "Is the dog giving a high five to a woman?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the dog engaged in giving a high five to a woman?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the dog execute the action of giving a high five to a woman?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the dog running towards a woman?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the dog catching food from a woman?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Did the dog lick the woman?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3411228673": { "direction": [ { "question": "Is the direction of the movement in the video upwards among skyscraper buildings?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the path of movement in the video flying upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera moving downwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the path of movement in the video flying backwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1043487715": { "action": [ { "question": "Are the children diving into water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the activity involving the children in the video about diving into water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is diving into water the primary action performed by the children?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the children eating?", "gt-answer": "no", "video-llm-prediction": "No, the children are not eating. They are swimming and playing in the pool.", "match_success": true, "rating": 1 }, { "question": "Is the activity involving the children in the video about hiking?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is cooking the primary action performed by the children?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Are the children diving into water and then making gestures to the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the children making gestures to the camera after diving into water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is diving into water followed by making gestures to the camera in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the children making gestures to the camera and then diving into water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the children leaving the swimming pool and then making gestures to the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is making gestures to the camera followed by diving into water in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093737353": { "direction": [ { "question": "Is the camera panning to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the direction of the camera's movement rightwards?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera panning to the left?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the direction of the camera's movement downwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the order that the equipments are shown in the video a line of test tubes and then a beaker?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the test tubes shown before the beaker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the beaker shown after the test tubes?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order that the equipments are shown in the video a beaker and then a line of test tubes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the test tubes shown after the beaker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the beaker shown before the test tubes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1063373449": { "attribute_change": [ { "question": "Is the coronavirus dissolving under the attack of antibodies?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the coronavirus assembling together", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1017768724": { "direction": [ { "question": "Is the person moving rightwards?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person turning rightwards?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person rotating to the right?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving leftwards?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person turning upwards?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person moving downwards?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1106280325": { "action": [ { "question": "Is the woman reading a book?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in the activity of reading a book?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can a woman be seen reading a book on the grass in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman hiking?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not hiking. She is laying on the ground and reading a book.", "match_success": true, "rating": 1 }, { "question": "Is the woman playing guitar?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not playing guitar. She is reading a book and looking at the camera.", "match_success": true, "rating": 1 }, { "question": "Is the woman sleeping?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Does a girl appear before the body of water in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a body of water shown after a girl reading a book in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a body of water shown before a girl reading a book in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does a girl appear after the body of water in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100117263": { "direction": [ { "question": "Is the little lion's motion downward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the little lion falling from the back of an adult lion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the little lion going in the direction of falling down?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the little lion's motion upward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the little lion climbing to the back of an adult lion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the little lion climbing up?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "15695290": { "action": [ { "question": "Is the person drawing a picture?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the activity of the person about drawing a picture?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is drawing a picture the main task of the person?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person playing soccer?", "gt-answer": "no", "video-llm-prediction": "No, the person is not playing soccer. They are drawing a house and people on a piece of paper.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the person about dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is typing on the computer the main task of the person?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "order": [ { "question": "Is a house being drawn before a family of people in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the house being drawn first, and then the family of people in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a house is being drawn first and then a family of people?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a family of people being drawn before a house in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the family of people being drawn first, and then the house in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video that a family of people is being drawn first and then a house?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1091090295": { "order": [ { "question": "Does the bird fly onto the back of the hippo first, then a hippo pokes its head out of water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a bird flying onto the back of a hippo happen before a hippo pokes its head out of water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a hippo put its head into water before a bird flying onto the back of a hippo?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does a hippo poking its head out of water happen before a bird flying onto the back of a hippo?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1021488277": { "direction": [ { "question": "Is a person picking up the pineapple?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pineapple being picked up by a person?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can an individual be observed lifting the pineapple?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a person dropping down the pineapple?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pineapple being rotated by a person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the pineapple being pushed forward by a person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1106899445": { "action": [ { "question": "Is the person squeezing out toothpaste on the toothbrush?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the main action of the person in the video about squeezing out toothpaste on a toothbrush?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is toothpaste being squeezed on a toothbrush what happens in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person brushing teeth using the toothbrush?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is removing toothpaste from the toothbrush the main action of the person in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is toothpaste being washed from a toothbrush what happens in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067925569": { "order": [ { "question": "Is the order of events in the video first a container ship is shown and then a cargo train is shown?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the events presented in the video in the sequence of first a container ship is shown and secondly a cargo train is shown?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a cargo train come after a container ship in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video first a cargo train is shown and then a container ship is shown?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the events presented in the video in the sequence of first a cargo train is shown and secondly a container ship is shown?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does a container ship come after a cargo train in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1062609286": { "attribute_change": [ { "question": "Is the battery charge increasing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the battery charge describe a rise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the battery charge decreasing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the battery charge staying constant?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100397435": { "action": [ { "question": "Is the person in the video starting the robot vacuum cleaner?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the robot vacuum cleaner being turned on?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person turning off the robot vacuum cleaner?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person in the video fixing the robot vacuum cleaner?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the robot vacuum cleaner moving to the right side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the movement pattern of the robot vacuum cleaner a straight line to the right side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the robot vacuum cleaner heading to the right side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the robot vacuum cleaner moving to the left side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "IIs the robot vacuum cleaner moving to the bottom side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the robot vacuum cleaner heading to the upper side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Does the person enter the screen first and then the robot vacuum cleaner starts moving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a person enter the screen before the robot vacuum cleaner starts moving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the first event in the video about a person entering the screen and then the robot vacuum cleaner starts moving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the robot vacuum cleaner start moving first and then a person enters the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the robot vacuum cleaner start moving before a person enters the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the first event in the video about the robot vacuum cleaner starting to move and then a person enters the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1108534143": { "direction": [ { "question": "Is the puppy walking out of a wigwam?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the puppy's movement walking out of a wigwam?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is walking out of a wigwam the action the puppy is taking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the puppy staying in a wigwam without going out?", "gt-answer": "no", "video-llm-prediction": "No. The puppy is seen walking around the wigwam and going outside to play.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the puppy's movement entering a wigwam?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is walking around a wigwam the action the puppy is taking?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1034049020": { "action": [ { "question": "Is the woman painting a wall while walking?", "gt-answer": "yes", "video-llm-prediction": "Yes, the woman is painting a wall while walking.", "match_success": true, "rating": 1 }, { "question": "Is the activity in the video about painting a wall while walking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is painting a wall while walking the action the woman is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman cleaning a wall while walking?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the activity in the video about standing still and painting a wall?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is standing and cleaning a wall the action the woman is performing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the order of events Painting a wall while walking, then turning back?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the events occurring in the order of Painting a wall while walking, then turning back?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the woman turn back after painting a wall while walking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events Turning back and painting the wall, then walking?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the events occurring in the order of Turning back first and later painting a wall while walking?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the woman sit down after painting a wall?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1047368344": { "direction": [ { "question": "Is the girl jumping into water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In which direction is the girl moving? Is it towards the water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the girl jumping out of water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In which direction is the girl moving? Is it away from the water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the girl taking off clothes and then jumping into water?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Does the girl take off clothes before jumping into water?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the sequence of actions performed by the girl: taking off clothes, putting on clothes, jumping into water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the girl jumping into water and then putting on clothes?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the girl jump into water before taking off clothes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the sequence of actions performed by the girl: putting on clothes, jumping into water, taking off clothes?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1060403198": { "attribute_change": [ { "question": "Is the tree increasing its height?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tree undergoing a transformation of growing up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can we use the term 'growing' to describe the change happening to the tree?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the tree decreasing its height?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the tree undergoing a transformation of becoming shorter?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can we use the term 'falling down' to describe the change happening to the tree?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100074677": { "order": [ { "question": "Did the person write something on the paper note and then stand it up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the person arrange the actions by writing something on the paper note and then standing it up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the person stands up the paper note and then write something on it?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Did the person arrange the actions by standing the paper note up and then writing something on it?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100350201": { "order": [ { "question": "Is the little girl drawn before the man in the video?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Does the drawing of the little girl occur before the drawing of the man in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that the little girl is drawn first and then the man is drawn?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man drawn before the little girl in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the drawing of the man occur before the drawing of the little girl in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video that the man is drawn first and then the little girl is drawn?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1099109715": { "attribute_change": [ { "question": "Is the number of fruits and vegetables increasing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the change to the fruits and vegetables about increasing number?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it accurate to say that the number of fruits and vegetables is getting bigger?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the number of fruits and vegetables becoming smaller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change to the fruits and vegetables about disappearing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is it accurate to say that the number of fruits and vegetables is getting smaller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1051211272": { "attribute_change": [ { "question": "Is the toast with cream cheese gradually being eaten out and disappearing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the toast with cream cheese disappear completely in the final?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the toast with cream cheese getting bigger?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the toast with cream cheese grow in size?", "gt-answer": "no", "video-llm-prediction": "Yes, the toast with cream cheese grows in size as the tomato is added to it.", "match_success": true, "rating": 0 } ] }, "1059815936": { "attribute_change": [ { "question": "Is the paper changing from a wrinkled paper ball into a flattened sheet?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the paper unfolding?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the main change occurring in the paper changing from a wrinkled paper ball into a flattened sheet?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the paper changing from a flattened sheet into a wrinkled paper ball?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the paper tearing apart?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the paper crumpling into a ball?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086423566": { "order": [ { "question": "Is food added into the bowl and then the bowl rotates?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In what sequence do the events occur in the video: food added into the bowl and then the bowl rotates?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is this the correct order of actions: food added into the bowl and then the bowl rotates?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the bowl rotating before adding food into it?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In what sequence do the events occur in the video: food added into the bowl after the bowl rotates?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is this the correct order of actions: the bowl rotates and then food added into the bowl?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1069611487": { "order": [ { "question": "Did the video show a pizza box appearing and then pizza slices being taken away?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the video show pizza slices being taken away after a pizza box appeared?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Did the events in the video occur in the order: a paper box appears, then pizza slices disappear?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the video show pizza slices disappearing before a pizza box appeared?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Did the video show a paper box appearing as the last event?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Did the events in the video occur in the order: pizza slices appear, then a paper box appears?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1034419625_reverse": { "direction": [ { "question": "Is the man moving from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the camera's point of view, is the man moving from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In relation to the camera's position, is the man headed from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man moving from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In the camera's point of view, is the man moving from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In relation to the camera's position, is the man headed from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1094590221_reverse": { "direction": [ { "question": "Does the position of the basketball moving rightwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the position of the basketball moving leftwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1111657885_reverse": { "direction": [ { "question": "Are the people skating towards the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the direction that the people moving towards the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the movement of the people towards the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the people skating away from the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people moving away in relation to the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the movement of the people away from the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 } ] }, "1089810425_reverse": { "direction": [ { "question": "Is the panning direction in the video left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera movement in the video panning from left to right?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video shifting horizontally?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera moving rightward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the panning direction in the video right to left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera movement in the video zooming in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video shifting vertically?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera moving leftward?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059718130_reverse": { "direction": [ { "question": "Is the sun falling?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the direction of the sun about falling?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is falling the primary movement of the sun?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun rising?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sun making a circular motion?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is ascending the primary movement of the sun?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the video's brightness turning darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the brightness decreasing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the brightness of the entire video fading away?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video darkening?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video getting brighter?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the attribute of brightness remaining stable?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the brightness of the video intensifying?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the brightness of the video remaining constant?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1083845854_reverse": { "direction": [ { "question": "Are the clock hands moving counterclockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the clock hands moving clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100329207_reverse": { "direction": [ { "question": "Is the direction of the camera view moving backward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video panning in the backward direction?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera movement directed towards moving backward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the camera view moving forward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video panning downwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera movement tilting up?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1089201973_reverse": { "direction": [ { "question": "Is the football moving from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the football moving from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1034736653_reverse": { "direction": [ { "question": "Are the woman athletes running from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the woman athletes running from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1084153195_reverse": { "direction": [ { "question": "Are the dolphins swimming away from the shore?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In which direction are the dolphins swimming? Away from the shore?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the dolphins hovering in one place in the entire video?", "gt-answer": "no", "video-llm-prediction": "No. The dolphins are seen swimming in the water and changing positions throughout the video.", "match_success": true, "rating": 1 }, { "question": "Are the dolphins swimming towards the shore?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1081092839_reverse": { "direction": [ { "question": "Is the direction of the sun ascending?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the movement pattern of the sun rising?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the sun travel upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the sun descending?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the movement pattern of the sun falling?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the sun travel downwards during sunrise", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059462749_reverse": { "direction": [ { "question": "Is the person moving upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the word 'ascending' describe the movement of the person?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person ascending from a lower point to a higher point?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving downwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the word 'falling' describe the movement of the person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person descending towards a lower point from a higher point?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1088279109_reverse": { "direction": [ { "question": "Is the elevator descending?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the elevator moving down?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is descending the direction of the elevator's movement?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the elevator going up?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is ascending the direction of the elevator's movement?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the elevator stopped?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096612823_reverse": { "direction": [ { "question": "Is the video zooming out?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is direction of movement zooming out?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video changing by zooming out?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video zooming in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video rotating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video panning left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1075484900_reverse": { "direction": [ { "question": "Is the child turning towards the man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the child turning away from the man?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1090578917_reverse": { "direction": [ { "question": "Is the man leaping to his left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man moving towards the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man leaping to his right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man moving forwards?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1075338140_reverse": { "direction": [ { "question": "Is the ball rolling from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ball moving in the direction of rolling from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the ball travel in the direction of rolling from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ball spinning in place?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the ball moving counterclockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the ball rolling from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1067268403_reverse": { "direction": [ { "question": "Are the wind turbines rotating counterclockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the wind turbines rotating clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096007487_reverse": { "direction": [ { "question": "Is the 3d cloud spinning rightward from the camera's point of view?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the 3d cloud spinning rightward as seen from the camera's perspective?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the 3D cloud appear to be rotating rightward from the viewpoint of the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the 3d cloud spinning leftward from the camera's point of view?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the 3d cloud spinning upward from the camera's point of view?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the 3d cloud spinning downward from the camera's point of view?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1095939659_reverse": { "direction": [ { "question": "Is the light growing in a anticlockwise direction?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the direction of the light's movement clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1098785169_reverse": { "direction": [ { "question": "Is the direction of the galaxy's spin counterclockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the galaxy's spin clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099984801_reverse": { "direction": [ { "question": "Are the clouds moving away from the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the clouds moving towards the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the entire video getting brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the entire video turning darker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1082419672_reverse": { "direction": [ { "question": "Is the direction of movement in the video flying forwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the entire video moving forwards relative to the ship?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the direction of movement in the video flying backwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the entire video moving backwards relative to the ship?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1058985719_reverse": { "direction": [ { "question": "Is the airplane flying from top to bottom?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the airplane moving downwards on the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the airplane flying from bottom to top?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the airplane moving upwards on the screen?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055413730_reverse": { "direction": [ { "question": "Is the planet Earth spinning leftwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "According to the camera's perspective, is the rotational movement of the planet Earth spinning to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Based on the camera's viewpoint, is the apparent motion of the Earth spinning to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the planet Earth spinning rightwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "According to the camera's perspective, is the rotational movement of the planet Earth rotating upward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Based on the camera's viewpoint, is the apparent motion of the Earth a complete stop?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1081684532_reverse": { "direction": [ { "question": "Are the asteroids flying away from the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the asteroids flying towards the camera?", "gt-answer": "no", "video-llm-prediction": "No, the asteroids are not flying towards the camera. They are simply floating in space.", "match_success": true, "rating": 1 } ] }, "23391142_reverse": { "direction": [ { "question": "Is the video panning to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the movement of the video about panning to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the scene shifting to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video panning to the right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the movement of the video about zooming in?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the scene shifting to the bottom?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1053758117_reverse": { "direction": [ { "question": "Is the camera zooming out from a 3D digital brain?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera moving in the video by zooming out?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera standing still before a 3D digital brain?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the camera zooming in in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, the camera zooms in on the brain in the video.", "match_success": true, "rating": 0 } ] }, "1106668103_reverse": { "direction": [ { "question": "Is the direction of movement in the video moving backward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the primary motion depicted in the video about moving backward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the primary trajectory in the video involve moving backward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of movement in the video moving forward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the primary motion depicted in the video about moving leftward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the primary trajectory in the video involve moving right ward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1057163434_reverse": { "direction": [ { "question": "Is the chef removing the bread from the burger?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the chef putting the bread on top of the burger?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100319395_reverse": { "direction": [ { "question": "Is the circular pattern moving counter-clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the circular pattern spinning counter-clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the circular pattern spinning in the anticlockwise direction?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the circular pattern moving clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the circular pattern spinning clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the circular pattern spinning in the clockwise direction?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1101200293_reverse": { "direction": [ { "question": "Is the camera motion relative to the aircraft carrier counterclockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera motion relative to the aircraft carrier clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1072453637_reverse": { "direction": [ { "question": "Is the camera panning to the front of a fighter jet?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera panning to the back around a fighter jet?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "3396473605_reverse": { "direction": [ { "question": "Do the five stars disappear from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the five stars appear from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086820415_reverse": { "direction": [ { "question": "Is the large wave moving vertically towards the top of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the large wave move in the direction towards the top of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is moving vertically towards the top the direction of motion of the large wave?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the large wave moving horizontally towards the right side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the large wave move in the direction towards the bottom of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is moving vertically towards the bottom the direction of motion of the large wave?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1073831006_reverse": { "direction": [ { "question": "Are the zebras moving from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the zebras moving from right to left relative to the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the zebras heading leftward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the zebras moving from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the zebras moving away from the camera?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the zebras heading downward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1024867412_reverse": { "direction": [ { "question": "Is the car taking a right left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the car moving in the left direction?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is making a left turn the maneuver the car is making?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the car driving straight in the entire video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the car moving to the right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is making a right turn the maneuver the car is making?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1076877854_reverse": { "direction": [ { "question": "Is the closest robotic arm moving to the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can the closest robotic arm be observed moving to the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the closest robotic arm exhibit movement to the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the closest robotic arm moving towards the camera?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can the closest robotic arm be observed moving to the right side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the closest robotic arm sway back and forth?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100468035_reverse": { "direction": [ { "question": "Is the camera zooming backward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving towards zooming backward?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the camera show zooming backward movement?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera zooming forward?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the camera tracking right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the camera panning left?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Is the door gradually closing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the door changing by gradually closing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the change of the door best described as closing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the door remaining closed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the door changing by gradually opening?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the door gradually opening?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3411806181_reverse": { "direction": [ { "question": "Is the person moving the charging gun away from the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person unplugging the charging gun from the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving the charging gun towards himself?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving the charging gun towards the car?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person performing the action of plugging the charging gun into the car?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person moving the charging gun towards the side of the car?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1073914229_reverse": { "direction": [ { "question": "Do the trains travel away from each other?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the trains travel towards each other?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1093139559_reverse": { "direction": [ { "question": "Is the camera moving in the direction of zooming out?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does zooming out best describe the camera's motion?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving in the direction of zooming in?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is tilting upwards the best description of the camera's motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "attribute_change": [ { "question": "Are the light conditions on the football players turning darker?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it accurate to say that the football players are becoming dimmer?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the light conditions on the football players staying the same?", "gt-answer": "no", "video-llm-prediction": "Yes, the light conditions on the football players are staying the same.", "match_success": true, "rating": 0 }, { "question": "Is it accurate to say that the football players are becoming more visible?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1080591311_reverse": { "direction": [ { "question": "Is the jellyfish floating downwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of motion for the jellyfish downwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is going down the way the jellyfish is moving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the jellyfish moving towards the right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is floating to the left the direction of motion for the jellyfish?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is going up the way the jellyfish is moving?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "3411228673_reverse": { "direction": [ { "question": "Is the direction of the movement in the video downwards among skyscraper buildings?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the path of movement in the video flying downwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera moving upwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the path of movement in the video flying backwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1093737353_reverse": { "direction": [ { "question": "Is the camera panning to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the direction of the camera's movement leftwards?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera panning to the right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the direction of the camera's movement downwards?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1017768724_reverse": { "direction": [ { "question": "Is the person moving leftwards?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person turning leftwards?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person rotating to the left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person moving rightwards?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person turning upwards?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person moving downwards?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1100117263_reverse": { "direction": [ { "question": "Is the little lion's motion upward?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the little lion climbing to the back of an adult lion?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the little lion climbing up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the little lion's motion downward?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the little lion falling from the back of an adult lion?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the little lion going in the direction of falling down?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1021488277_reverse": { "direction": [ { "question": "Is a person dropping down the pineapple?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pineapple being dropped down by a person?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can an individual be observed dropping the pineapple?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a person picking up the pineapple?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the pineapple being rotated by a person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the pineapple being pushed forward by a person?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100397435_reverse": { "direction": [ { "question": "Is the robot vacuum cleaner moving to the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the movement pattern of the robot vacuum cleaner a straight line to the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the robot vacuum cleaner heading to the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the robot vacuum cleaner moving to the right side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "IIs the robot vacuum cleaner moving to the bottom side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the robot vacuum cleaner heading to the upper side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1108534143_reverse": { "direction": [ { "question": "Is the puppy entering a wigwam?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the puppy's movement entering a wigwam?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is entering a wigwam the action the puppy is taking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the puppy staying in a wigwam without going out?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the direction of the puppy's movement walking out of a wigwam?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is walking around a wigwam the action the puppy is taking?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1047368344_reverse": { "direction": [ { "question": "Is the girl jumping out of water?", "gt-answer": "yes", "video-llm-prediction": "No, the girl is not jumping out of water. She is seen running on a wooden bridge and jumping into the water.", "match_success": true, "rating": 0 }, { "question": "In which direction is the girl moving? Is it away from the water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the girl jumping into water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In which direction is the girl moving? Is it towards the water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1050618460_reverse": { "attribute_change": [ { "question": "Are the flowers turning into buds?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the flowers transform from full bloom to bud?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the flowers withering?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Do the flowers transform from bud to full bloom?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1083113449_reverse": { "attribute_change": [ { "question": "Is the sky getting brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "What is occurring to the sky? Is it getting brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sky getting darker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the sky maintaining its brightness?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1091143117_reverse": { "attribute_change": [ { "question": "Is the eye changing from open to closed?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the eye changing from closed to open?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098153561_reverse": { "attribute_change": [ { "question": "Are the leaves changing color from yellow to green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the initial color of the leaves yellow?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the final color of the leaves green?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Are the leaves changing color from green to yellow?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the initial color of the leaves green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the final color of the leaves yellow and red?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059072773_reverse": { "attribute_change": [ { "question": "Is the ice cream freezing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice cream evaporating?", "gt-answer": "yes", "video-llm-prediction": "Yes, the ice cream is evaporating.", "match_success": true, "rating": 1 }, { "question": "Is the ice cream melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the ice cream turning into liquid?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1093573255_reverse": { "attribute_change": [ { "question": "Is the plant wilting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the condition of the plant about withering?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the plant changing in a way that it is fading?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In what way is the plant transforming, is it deteriorating?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the plant reviving?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the condition of the plant about reviving?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the plant changing in a way that it is reviving?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In what way is the plant transforming, is it reviving?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1077146132_reverse": { "attribute_change": [ { "question": "Is the video turning darker?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video decreasing in terms of brightness?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the light condition getting dimmer?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video turning brighter?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the video increasing in terms of brightness?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the light condition getting brighter?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086688682_reverse": { "attribute_change": [ { "question": "Are the traffic lights changing from green to red?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the alteration taking place to the traffic lights transitioning from green to red?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the traffic lights changing from yellow to red?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the alteration taking place to the traffic lights transitioning from red to green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099738787_reverse": { "attribute_change": [ { "question": "Is the concrete wall growing taller?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the concrete wall assembling together?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the concrete wall falling apart?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the concrete wall changing by falling apart?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1094219575_reverse": { "attribute_change": [ { "question": "Are the flowers blooming?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the condition of the flowers blooming?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the transformation occurring to the flowers blooming?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the flowers growing taller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the flowers wilting?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the transformation occurring to the flowers sprouting new buds?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067427023_reverse": { "attribute_change": [ { "question": "Are the snow particles freezing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the primary attribute change experienced by the snow particles freezing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the snow particles melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is scattering the primary attribute change experienced by the snow particles?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1093948229_reverse": { "attribute_change": [ { "question": "Are the golden particles disappearing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is shrinking the best word that represents the change in the attribute of the golden particles?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is contracting the best word that represents the transformation taking place on the golden particles?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the golden particles exploding?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the change in the attribute of the golden particles involve exploding?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the transformation taking place on the golden particles represented by exploding?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1049965795_reverse": { "attribute_change": [ { "question": "Is the light bulb turning off?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "What change occurs in the light bulb? Is it getting darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is turning off the alteration that takes place in the light bulb?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "Is the light bulb lighting up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "What is happening to the light bulb? Is it lighting up?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is lighting up the alteration that takes place in the light bulb?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1052364490_reverse": { "attribute_change": [ { "question": "Is the digital bar chart decreasing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the digital bar chart growing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1080990179_reverse": { "attribute_change": [ { "question": "Is the apple ripening?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the apple becoming juicier?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is getting bigger and softer the change in the apple's attributes?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the apple shrinking and drying out?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the apple getting smaller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is shrinking and drying out the change in the apple's attributes?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1077575504_reverse": { "attribute_change": [ { "question": "Is the pile of salt shrinking?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the attribute change happening to the pile of salt about getting smaller?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt changing by vanishing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt growing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the attribute change happening to the pile of salt about growing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt changing by growing bigger?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "23370985_reverse": { "attribute_change": [ { "question": "Is the ice crystal melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the process occurring with the ice crystal reducing in size?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the transformation taking place in the ice crystal melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice crystal freezing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the process occurring with the ice crystal forming?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the transformation taking place in the ice crystal forming?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055981522_reverse": { "attribute_change": [ { "question": "Are the 3d shapes turning into cubes?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3d shapes changing from sphere into cubes?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3d shapes turning into spheres?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the 3d shapes changing from cubes into spheres?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1081734740_reverse": { "attribute_change": [ { "question": "Is the texture of the leaf turning from yellow to green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the leaf turning into green color?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring in the leaf that it is getting greener?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the texture of the leaf turning from green to yellow?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the leaf turning into yellow color?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the change occurring in the leaf that it is becoming yellow?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093719871_reverse": { "attribute_change": [ { "question": "Are the pink flowers turning from full blossom to withered?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the pink flowers become withered in the end?", "gt-answer": "yes", "video-llm-prediction": "Yes, the pink flowers become withered in the end.", "match_success": true, "rating": 1 }, { "question": "Are the pink flowers falling off petals?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the pink flowers turning from withered to full blossom?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055973887_reverse": { "attribute_change": [ { "question": "Is the fire ball getting smaller?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the fire ball changing its size and shape?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is shrinking in size the way the fire ball is transforming?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the fire ball staying the same size?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is getting bigger the way the fire ball is transforming?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is growing in size the way the fire ball is transforming?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1098710341_reverse": { "attribute_change": [ { "question": "Is the glass going from full of water to empty?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the final state of the glass empty?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the glass going from empty to full of water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is there water in the glass in the final of video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1099116143_reverse": { "attribute_change": [ { "question": "Is white foam disappearing from the surface of the pink liquid?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Can the visual observation of the pink liquid include white foam disappearing from the surface?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is white foam appearing on the surface of the pink liquid?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the pink liquid become green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1025623079_reverse": { "attribute_change": [ { "question": "Is the skyscraper growing taller?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring with the skyscraper being eracted?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the skyscraper collapsing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring with the skyscraper about collapsing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1063373449_reverse": { "attribute_change": [ { "question": "Is the coronavirus assembling together", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the coronavirus dissolving under the attack of antibodies?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1062609286_reverse": { "attribute_change": [ { "question": "Is the battery charge decreasing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the battery charge describe a decrease?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the battery charge increase?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the battery charge staying constant?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1060403198_reverse": { "attribute_change": [ { "question": "Is the tree decreasing its height?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tree undergoing a transformation of becoming shorter?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can we use the term 'shrinking' to describe the change happening to the tree?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tree increasing its height?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the tree undergoing a transformation of becoming taller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can we use the term 'falling down' to describe the change happening to the tree?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099109715_reverse": { "attribute_change": [ { "question": "Is the number of fruits and vegetables becoming smaller?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the change to the fruits and vegetables about disappearing?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is it accurate to say that the number of fruits and vegetables is getting smaller?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the number of fruits and vegetables increasing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change to the fruits and vegetables about increasing number?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is it accurate to say that the number of fruits and vegetables is getting bigger?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1051211272_reverse": { "attribute_change": [ { "question": "Is the toast with cream cheese getting bigger?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the toast with cream cheese grow in size?", "gt-answer": "yes", "video-llm-prediction": "Yes, the toast with cream cheese grows in size as the tomato is added to it.", "match_success": true, "rating": 1 }, { "question": "Is the toast with cream cheese gradually being eaten out and disappearing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the toast with cream cheese disappear completely in the final?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059815936_reverse": { "attribute_change": [ { "question": "Is the paper changing from a flattened sheet into a wrinkled paper ball?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the paper being folded?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the main change occurring in the paper changing from a flattened sheet into a wrinkled paper ball?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the paper changing from a wrinkled paper ball into a flattened sheet?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the paper tearing apart?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the paper unfolding?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059718130_concat_0": { "speed": [ { "question": "Is the sun above rising at the same speed as the sun below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are both suns rising at the same speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun below rising slower than the sun above?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the sun below rising faster than the sun above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059718130_concat_1": { "speed": [ { "question": "Is the sun above rising slower than the sun below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the sun below rising faster than the sun above?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the sun above have a slower speed compared to the sun below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun below rising slower than the sun above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sun above rising faster than the sun below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sun above rising at the same speed as the sun below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059718130_concat_2": { "speed": [ { "question": "Is the speed of the sun above rising faster than the sun below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun above rising faster than the sun below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun below rising faster than the sun above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the speeds of the sun above and the sun below the same?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098153561_concat_0": { "speed": [ { "question": "Does the forest above change color at the same speed as the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of color change in the forest above the same as the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the color change in the forest above happen at the same speed as the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the forest above change color faster than the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of color change in the forest above slower than the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the color change in the forest above occur faster than the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098153561_concat_1": { "speed": [ { "question": "Does the forest above change color slower than the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of color change in the forest above slower than the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speed of the color change in the forest above appear slower than the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the forest above change color faster than the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the speed of color change in the forest above appear to be at the same speed as the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed of color change in the forest above faster than the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1098153561_concat_2": { "speed": [ { "question": "Is the speed that the forest above changing color faster than the forest below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In relation to the speed of the forest below, does the speed of color change in the forest above appear faster?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed that the forest above changing color slower than the forest below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In relation to the speed of the forest below, does the speed of color change in the forest above appear equally fast?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059462749_concat_0": { "speed": [ { "question": "Is the person above climbing at the same speed as the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can it be said that the person above and below are moving at the same speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the person above equal to the speed of the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person above climbing faster than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can it be said that the person above is moving faster than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the person above slower than the speed of the person below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059462749_concat_1": { "speed": [ { "question": "Is the person above climbing slower than the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person above moving slower than the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the person above slower compared to the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person above climbing faster than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the person above moving faster than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the person above the same as the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059462749_concat_2": { "speed": [ { "question": "Is the person above climbing faster than the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can it be said that the person above is moving faster than the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the person above compared to the person below described as climbing faster?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person above climbing at the same speed as the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can it be said that the person above is moving slower than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the person above compared to the person below described as climbing slower?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059072773_concat_0": { "speed": [ { "question": "Is the ice cream above melting at the same speed as the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the melting speed of the ice cream above the same as the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the ice cream above melting faster than the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the ice cream above melting slower than the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059072773_concat_1": { "speed": [ { "question": "Is the ice cream above melting slower than the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the ice cream above melt at a slower speed than the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it true that the ice cream above is melting slower than the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice cream above melting faster than the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the ice cream above melt at the same speed as the ice cream below?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is it correct that the ice cream above is melting at the same speed as the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059072773_concat_2": { "speed": [ { "question": "Is the ice cream above melting faster than the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the melting speed of the ice cream above compare to the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of melting of the ice cream above faster than the ice cream below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ice cream above melting at the same speed as the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the ice cream above melting slower than the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the ice cream above melt at a slower speed compared to the ice cream below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1090578917_concat_0": { "speed": [ { "question": "Is the man above jumping at the same speed as the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the speed of the man above jumping look the same as the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping slower than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed of the man below slower than the man above?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1090578917_concat_1": { "speed": [ { "question": "Is the man above jumping at a slower speed than the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the speed of the man above jumping look slower in comparison to the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping slower than the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping at the same speed as the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed of the man above jumping faster than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are both men jumping at the same speed?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1090578917_concat_2": { "speed": [ { "question": "Is the man above jumping faster than the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speed of the man above jumping look faster in comparison to the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man below jumping slower than the man above?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping at the same speed as the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed of the man above jumping slower in comparison to the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man above jumping slower than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1075338140_concat_0": { "speed": [ { "question": "Is the speed of the ball above moving at the same speed as the ball below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the ball above the same as the speed of the ball below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the ball above moving slower than the ball below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the ball below moving faster than the ball above?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1075338140_concat_1": { "speed": [ { "question": "Is the speed of the ball above slower than the ball below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the ball below moving faster than the ball above?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the ball above described as slower compared to the ball below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the ball above faster than the ball below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the ball above moving at the same speed as the ball below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed of the ball above described as faster compared to the ball below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1075338140_concat_2": { "speed": [ { "question": "Is the ball above moving faster than the ball below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Compared to the ball below, is the speed of the ball above faster?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the ball below moving faster than the ball above?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Compared to the ball below, is the speed of the ball above slower?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1077575504_concat_0": { "speed": [ { "question": "Is the speed of the pile of salt above growing at the same speed as the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt above growing at the same pace as the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the growth rate of the pile of salt above equal to the growth rate of the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the pile of salt above growing at a faster speed than the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pile of salt above growing slower than the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the growth rate of the pile of salt above slower than the growth rate of the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1077575504_concat_1": { "speed": [ { "question": "Is the speed of the pile of salt above growing at a slower speed than the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt above growing slower compared to the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the pile of salt above described as growing slower than the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the pile of salt above growing at a faster speed than the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pile of salt above growing at an equal pace compared to the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the pile of salt above described as growing at the same rate as the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1077575504_concat_2": { "speed": [ { "question": "Is the pile of salt above growing at a faster speed than the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt above growing faster compared to the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the pile of salt above described as growing faster than the pile of salt below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pile of salt above growing at the same speed as the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pile of salt above growing slower compared to the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the pile of salt above described as growing slower than the pile of salt below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100319395_concat_0": { "speed": [ { "question": "Is the white circle above rotating at the same speed as the white circle below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the rotation speed of the white circle above the same as the white circle below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the white circle above rotating faster than the white circle below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the white circle above rotating slower than the white circle below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100319395_concat_1": { "speed": [ { "question": "Is the white circle above rotating faster than the white circle below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the rotation of the white circle above faster compared to the white circle below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the white circle above rotating at the same speed as the white circle below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the rotation of the white circle above slower compared to the white circle below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100319395_concat_2": { "speed": [ { "question": "Is the speed of the white circle above slower than the white circle below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Compared to the white circle below, is the rotation of the white circle above slower?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the white circle above faster than the white circle below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Compared to the white circle below, is the rotation of the white circle above faster?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086820415_concat_0": { "speed": [ { "question": "Is the speed of the wave above the same as the speed of the wave below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the wave above equal to the speed of the wave below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the wave below moving faster than the wave above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the wave above lesser than the wave below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086820415_concat_1": { "speed": [ { "question": "Is the speed of the wave above greater than the wave below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the wave above greater than the speed of the wave below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the wave above moving slower than the wave below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is both waves moving at the same speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086820415_concat_2": { "speed": [ { "question": "Is the wave above moving slower than the wave below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the wave above lesser than the speed of the wave below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the wave above moving at the same speed as the wave below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the wave above greater than the speed of the wave below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096238125_concat_0": { "speed": [ { "question": "Are the two people above lifting the kettlebell at the same speed as the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In relation to the two people below, are the two people above lifting the kettlebell moving at the same speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the two people above lifting the kettlebell move at the same speed as the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the two people above lifting the kettlebell slower than the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In relation to the two people below, are the two people above lifting the kettlebell moving faster?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Do the two people above lifting the kettlebell move slower compared to the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096238125_concat_1": { "speed": [ { "question": "Are the two people above lifting the kettlebell faster than the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the two people above lifting the kettlebell move faster in relation to the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the two people above lifting the kettlebell move faster compared to the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the two people above lifting the kettlebell slower than the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the two people above lifting the kettlebell moving at the same speed as the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the two people above lifting the kettlebell slower when compared to the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096238125_concat_2": { "speed": [ { "question": "Are the two people above lifting the kettlebell slower than the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the two people above lifting the kettlebell moving slower in relation to the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the two people above lifting the kettlebell moving slower relative to the two people below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the two people above lifting the kettlebell at the same speed as the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the two people above lifting the kettlebell faster than the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the two people above lifting the kettlebell moving faster in relation to the two people below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1056433484_concat_0": { "speed": [ { "question": "Is the speed of the earth above the same as the speed of the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speed of the earth above compare to the speed of the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it accurate to say that the speed of the earth above is the same as the speed of the earth below?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the earth above slower than the speed of the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the earth above faster than the speed of the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is it accurate to say that the speed of the earth above rotates faster than the speed of the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1056433484_concat_1": { "speed": [ { "question": "Is the speed of the earth above slower than the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speed of the earth above compare slower to the speed of the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the statement 'It rotates slower than the earth below' accurately describes the speed of the earth above?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the earth above faster than the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the speed of the earth above compare the same as the speed of the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the statement 'It rotates faster than the earth below' accurately describes the speed of the earth above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1056433484_concat_2": { "speed": [ { "question": "Does the earth above rotate faster than the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the earth above faster than the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it accurate to say that the speed of the earth above is faster than the earth below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the earth above rotate at the same speed as the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the earth above slower than the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is it accurate to say that the speed of the earth above is slower than the earth below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "15695290_concat_0": { "speed": [ { "question": "Is the person above drawing a picture at the same speed as the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is it true that they draw at an equal rate in the comparison of the speed of drawing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person above drawing a picture more slowly than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person above drawing a picture faster than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "15695290_concat_1": { "speed": [ { "question": "Is the person above drawing a picture slower than the person below?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "Does the person above draw a picture more slowly compared to the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person below considered faster in drawing compared to the person above?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person above drawing a picture faster than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the person above draw a picture at an equal speed as the person below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person above considered faster in drawing compared to the person below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "15695290_concat_2": { "speed": [ { "question": "Is the person above drawing a picture faster than the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the person above draw a picture more rapidly than the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person above considered faster in drawing compared to the person below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the person above drawing a picture slower than the person below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the person above draw a picture at the same speed as the person below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person below considered faster in drawing compared to the person above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1047368344_concat_0": { "speed": [ { "question": "Is the girl running at the same speed as the girl below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the speed of the girl above compare to the girl below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the speed of the girl above the same as the girl below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the girl running slower than the girl below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the girl running faster than the girl below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the girl above faster than the girl below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1047368344_concat_1": { "speed": [ { "question": "Is the girl above running slower than the girl below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Would you describe the speed of the girl above relative to the girl below as slower?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the speed of the girl above compare to the girl below as the same?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed of the girl above faster than the girl below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1047368344_concat_2": { "speed": [ { "question": "Is the girl above running faster than the girl below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the speed of the girl above compare to the girl below as faster?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Would you describe the speed of the girl above relative to the girl below as faster?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the girl above running at the same speed as the girl below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the speed of the girl above compare to the girl below as slower?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Would you describe the speed of the girl above relative to the girl below as slower?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1060403198_concat_0": { "speed": [ { "question": "Is the speed of the tree above growing at the same speed as the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the tree above grow at the same speed as the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are both trees growing at an equal speed - the tree above and the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tree above growing slower than the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the tree above growing faster than the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the tree below growing at a higher speed than the tree above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1060403198_concat_1": { "speed": [ { "question": "Is the tree above growing faster than the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the tree above grow faster compared to the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tree above growing at a higher speed than the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the tree above growing slower than the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the tree above grow at the same speed as the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the tree below growing at a higher speed than the tree above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1060403198_concat_2": { "speed": [ { "question": "Is the tree above growing slower than the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the tree above grow slower compared to the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the growth of the tree above slower than the tree below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the tree above growing at the same speed as the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the tree above growing faster than the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the growth of the tree above faster than the tree below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100058499_concat_0": { "speed": [ { "question": "Is the man above jumping rope at the same speed as the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the man above jump rope at the same speed as the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are both the man above and the man below jumping rope at the same speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping rope faster than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the man above jumping rope slower than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man above jumping rope at a slower speed compared to the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1100058499_concat_1": { "speed": [ { "question": "Is the man above jumping rope slower than the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping rope at a slower speed compared to the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping rope at a slower speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping rope faster than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man above jumping rope at the same speed as the man below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are both men jumping rope at the same speed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1100058499_concat_2": { "speed": [ { "question": "Is the man above jumping rope faster than the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the man above jump rope faster than the man below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man below jumping rope at a slower speed than the man above?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man above jumping rope slower than the man below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the man below jump rope faster than the man above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is both the man above and the man below jumping rope at the same speed?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1092813279_concat_0": { "speed": [ { "question": "Are the woman below and two women doing push ups at the same speed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the push ups of the woman above and woman below at the same speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the woman above's push ups the same as the woman below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman above doing push ups slower?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the woman above's push ups faster than the woman below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the woman above's push ups have a slower speed compared to the woman below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1092813279_concat_1": { "speed": [ { "question": "Is the woman above doing push ups slower?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the woman above's push ups slower compared to the woman below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed of the woman above's push ups slower compared to the woman below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman below doing push ups slower?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the woman above's push ups faster compared to the woman below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the speed of the woman above's push ups same as the woman below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1092813279_concat_2": { "speed": [ { "question": "Is the woman below doing push ups slower?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the woman above do her push ups faster compared to the woman below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Would you describe the speed of the woman above's push ups as faster compared to the woman below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman above doing push ups slower?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the woman below do her push ups faster compared to the woman above?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Would you describe the speed of the woman above's push ups as slower compared to the woman below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1084518106_concat_0": { "speed": [ { "question": "Is the truck driving at the same speed as the truck below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speed of the truck above compare to the truck below the same?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the truck above moving at a higher speed than the truck below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the truck driving slower than the truck below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1084518106_concat_1": { "speed": [ { "question": "Is the truck above driving faster than the truck below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the truck above have a higher speed compared to the truck below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the truck above moving at a higher speed than the truck below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the truck above driving slower than the truck below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the truck above the same speed as the truck below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the truck below moving at a higher speed than the truck above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1084518106_concat_2": { "speed": [ { "question": "Is the truck above driving slower than the truck below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the speed of the truck above compare to the truck below in terms of being slower?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the truck below moving at a higher speed compared to the truck above?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the truck above driving faster than the truck below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the speed of the truck above compare to the truck below in terms of being the same?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the truck above moving at a higher speed compared to the truck below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1062609286_concat_0": { "speed": [ { "question": "Is the battery charge above increasing at the same speed as the battery charge below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can it be said that the speed at which the battery charge above is increasing equal to the battery charge below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the charging speed above the same as the charging speed below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the battery charge above increasing at a slower speed than the battery charge below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Can it be said that the speed at which the battery charge above is increasing faster than the battery charge below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the charging speed above slower than the charging speed below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1062609286_concat_1": { "speed": [ { "question": "Is the battery charge above increasing at a slower speed than the battery charge below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can it be said that the speed at which the battery charge above is increasing is slower than the battery charge below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the charging speed above slower in relation to the charging speed below?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the battery charge above increasing at a faster speed than the battery charge below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Can it be said that the speed at which the battery charge above is increasing is faster than the battery charge below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the charging speed above the same in relation to the charging speed below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1062609286_concat_2": { "speed": [ { "question": "Is the battery charge above increasing at a faster speed than the battery charge below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can it be said that the speed at which the battery charge above is increasing is faster than the battery charge below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the charging speed above faster compared to the charging speed below?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the battery charge above increasing at a slower speed than the battery charge below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Can it be said that the speed at which the battery charge above is increasing is slower than the battery charge below?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the charging speed above the same as the charging speed below?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1111601171_reverse": { "attribute_change": [ { "question": "Is the sphere building changing from blue to green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sphere building turning green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sphere building transforming by changing from blue to green?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sphere building changing from green to blue?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sphere building turning blue?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sphere building transforming by changing from green to blue?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086105089_reverse": { "attribute_change": [ { "question": "Is the building demolishing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the building getting shorter?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the building being deconstructed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the building being constructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the building growing taller?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the building renovating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1058498242_reverse": { "attribute_change": [ { "question": "Are the 3D pixels changing from the shape of a man into a cuboid?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3D pixels transforming by changing from the shape of a man into a cuboid?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3D pixels changing from a cuboid into the shape of a man?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the 3D pixels transforming by changing from a cuboid into the shape of a man?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1082268005_reverse": { "attribute_change": [ { "question": "Is the planet earth disassembling and disappearing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the planet earth transforming by disassembling and disappearing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the planet earth assembling from toy bricks?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the planet earth splitting into two halves?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1070711428_reverse": { "attribute_change": [ { "question": "Is the glacier assembling and rising from water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is assembling and rising from water occurring to the glacier?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the glacier breaking and falling in water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is breaking and falling in water occurring to the glacier?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1057447372_reverse": { "attribute_change": [ { "question": "Is the sport stadium turning darker?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sport stadium transforming into a darker state?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the sport stadium staying the same brightness?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the sport stadium becoming brighter?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1053334574_reverse": { "attribute_change": [ { "question": "Is the black ink shrinking into the center?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the black ink expanding from the center?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1016172301_reverse": { "attribute_change": [ { "question": "Is the 3D house model being demolished?", "gt-answer": "yes", "video-llm-prediction": "No, the 3D house model is not being demolished. The video shows the model being built and then taken apart.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring to the 3D house model that it is being deconstructed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the 3D house model being constructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring to the 3D house model that it is being constructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1084736389_reverse": { "attribute_change": [ { "question": "Is the face morphing from a human into a chimpanzee?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the face morphing from a chimpanzee into a human?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1054494542_reverse": { "attribute_change": [ { "question": "Is the background changing from blue to pink?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the background transforming into pink?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the main change occurring in the background changing it from blue to pink?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the background changing from pink to blue?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the background turning blue?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the main change occurring in the background changing it from pink to blue?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1055194940_reverse": { "attribute_change": [ { "question": "Is the insect transforming from butterfly into pupa?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring in the insect transforming from butterfly into pupa?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the insect transforming from pupa into butterfly?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring in the insect transforming from dead to live?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1079384099_reverse": { "attribute_change": [ { "question": "Is the 3d pixel transforming from the shape of a flower into a white square?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the final shape of the 3d pixel a square?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the 3d pixel transform from a flower to a square?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the 3d pixel transforming from the shape of a white square into a flower?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the final shape of the 3d pixel a flower?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the 3d pixel transform from a heart to a flower?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099811331_reverse": { "attribute_change": [ { "question": "Is the 3d heart gradually disappearing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the 3d heart gradually appearing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093340469_reverse": { "attribute_change": [ { "question": "Is the room turning brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the word 'brightening' best describe the change in the room?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the attribute of the room brightening up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the room staying the same brightness?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the word 'darkening' best describe the change in the room?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the attribute of the room becoming darker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1111601171": { "attribute_change": [ { "question": "Is the sphere building changing from green to blue?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sphere building turning blue?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sphere building transforming by changing from green to blue?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sphere building changing from blue to green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sphere building turning green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sphere building transforming by changing from blue to green?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086105089": { "attribute_change": [ { "question": "Is the building constructed?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the building getting taller?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the building being constructed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the building being deconstructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the building growing shorter?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the building renovating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1058498242": { "attribute_change": [ { "question": "Are the 3D pixels changing from a cuboid into the shape of a man?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the 3D pixels transforming by changing from a cuboid into the shape of a man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the 3D pixels changing from the shape of a man into a cuboid?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the 3D pixels transforming by changing from the shape of a man into a cuboid?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1082268005": { "attribute_change": [ { "question": "Is the planet earth assembling from toy bricks?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the planet earth transforming by assembling from toy bricks?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the planet earth disassembling and disappearing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the planet earth splitting into two halves?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1070711428": { "attribute_change": [ { "question": "Is the glacier breaking and falling in water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is breaking and falling in water occurring to the glacier?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the glacier assembling and rising from water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is assembling and rising from water occurring to the glacier?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1057447372": { "attribute_change": [ { "question": "Is the sport stadium turning brighter?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the sport stadium transforming into a brighter state?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sport stadium staying the same brightness?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the sport stadium becoming darker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1053334574": { "attribute_change": [ { "question": "Is the black ink expanding from the center?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the black ink shrinking into the center?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1016172301": { "attribute_change": [ { "question": "Is the 3D house model being constructed?", "gt-answer": "yes", "video-llm-prediction": "Yes, the 3D house model is being constructed.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring to the 3D house model that it is being constructed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the 3D house model being demolished?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring to the 3D house model that it is being deconstructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1084736389": { "attribute_change": [ { "question": "Is the face morphing from a chimpanzee into a human?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the face morphing from a human into a chimpanzee?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1054494542": { "attribute_change": [ { "question": "Is the background changing from pink to blue?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the background turning blue?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the main change occurring in the background changing it from pink to blue?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the background changing from blue to pink?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the background transforming into pink?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the main change occurring in the background changing it from blue to pink?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1055194940": { "attribute_change": [ { "question": "Is the insect transforming from pupa into butterfly?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the change occurring in the insect transforming from pupa into butterfly?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the insect transforming from butterfly into pupa?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the change occurring in the insect transforming from dead to live?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1079384099": { "attribute_change": [ { "question": "Is the 3d pixel transforming from the shape of a white square into a flower?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the final shape of the 3d pixel a flower?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the 3d pixel transform from a square to a flower?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the 3d pixel transforming from the shape of a flower into a white square?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the final shape of the 3d pixel a square?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the 3d pixel transform from a heart to a flower?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1099811331": { "attribute_change": [ { "question": "Is the 3d heart gradually appearing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the 3d heart gradually disappearing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093340469": { "attribute_change": [ { "question": "Is the room turning darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the word 'darkening' best describe the change in the room?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the attribute of the room becoming darker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the room staying the same brightness?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the word 'brightening' best describe the change in the room?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the attribute of the room brightening up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_0": { "order": [ { "question": "Are the sun rising and ice cream melting at the same time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do sun rising and ice cream melting occur simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sun rising happening before ice cream melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the ice cream melting and sun rising happening at different times?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_1": { "order": [ { "question": "Does the ice cream melt before the sun rises?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the ice cream melt and then the sun rises in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the sun rise before the ice cream melts in the video?", "gt-answer": "no", "video-llm-prediction": "Yes, the sun rises before the ice cream melts in the video.", "match_success": true, "rating": 0 }, { "question": "Do both events occur at the same time in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1059072773_1059718130_2": { "order": [ { "question": "Does the sun rise before the ice cream melts?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the sequence of events in the video sun rising and ice cream melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the ice cream melt before the sun rises?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sequence of events in the video ice cream melting and sun rising?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1024867412_1034049020_0": { "order": [ { "question": "Is a girl walking on the street while a dog is simultaneously driving?", "gt-answer": "yes", "video-llm-prediction": "No", "match_success": true, "rating": 0 }, { "question": "Is a girl walking on the street while a dog is driving at the same time?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a girl walk on the street before the dog starts driving?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is a girl walking on the street followed by a dog driving in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1024867412_1034049020_1": { "order": [ { "question": "Is a dog driving and then a girl walking on the street?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video show a sequence of a dog driving, followed by a girl walking on the street?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a girl walking on the street and then a dog driving?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the video show a sequence of a girl walking on the street, followed by a dog driving?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1024867412_1034049020_2": { "order": [ { "question": "Is a girl walking on the street, then a dog is driving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a girl walking on the street occur before a dog driving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a dog driving, then a girl is walking on the street?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does a dog driving occur before a girl walking on the street?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1096238125_1098970151_0": { "order": [ { "question": "Are two people lifting weights at the same time as a cat licking its paw?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is a cat licking its paw while concurrently two people are lifting weights happening in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are two people lifting weights after a cat licking its paw?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does two people lifting weights followed by a cat licking its paw happen in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1096238125_1098970151_1": { "order": [ { "question": "Are two people lifting weights and then a cat is licking its paw in the video?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is a cat licking its paw followed by two people lifting weights?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1096238125_1098970151_2": { "order": [ { "question": "Is a cat licking its paw and then two people lifting weights?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a cat lick its paw before two people lift weights?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is two people lifting weights and then a cat is licking its paw?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does two people lifting weights happen before a cat licking its paw?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_0": { "order": [ { "question": "Are the woman and the man showing different expressions at the same time?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the video presenting the woman and man showing their expressions simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the woman and man show their expressions at the same time?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man showing different expressions before the woman?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the woman showing different expressions before the man?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the woman and the man appearing at different time?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_1": { "order": [ { "question": "Does the video show the woman showing different expressions first, followed by the man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is it true that the man shows his expressions first, followed by the man?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1069717165_1041584314_2": { "order": [ { "question": "Is the order of events in the video: First, a man is showing different expressions; then, a woman is showing different expressions?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the video, does the man present his expressions first, followed by the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video: Both the woman and the man are showing different expressions at the same time?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In the video, does the woman present her expressions first, followed by the man?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_0": { "order": [ { "question": "Is the correct order of events in the video the fire ball expanding, while simultaneously the earth is spinning?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the correct order of events in the video the fire ball expanding, then the earth is spinning?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_1": { "order": [ { "question": "Is the correct order of events in the video about the earth spinning first and then the fire ball expanding?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the correct order of events in the video about the fire ball expanding first and then the earth spinning?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1055413730_1055973887_2": { "order": [ { "question": "Is the correct order of events in the video that the fire ball is expanding, then the earth is spinning?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the earth spinning before the fire ball is expanding in the correct order of events in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_0": { "order": [ { "question": "Is a person picking up a pineapple and a squirrel foraging happening concurrently in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a squirrel foraging and a person picking up a pineapple at the same time in the video?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is a person picking up a pineapple and then a squirrel foraging in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is a squirrel foraging and then a person picking up a pineapple in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_1": { "order": [ { "question": "Is a squirrel foraging and then a person picking up a pineapple in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In the video, is the first event a squirrel foraging and then a person picking up a pineapple?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "According to the video, does a squirrel forage before a person picks up a pineapple?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a person picking up a pineapple and then a squirrel foraging in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In the video, is the first event a person picking up a pineapple and then a squirrel foraging?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "According to the video, does a person pick up a pineapple before a squirrel starts foraging?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1058907236_1021488277_2": { "order": [ { "question": "Is a person picking up a pineapple and then a squirrel is foraging?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the video, are events happening in the sequence: first, a person is picking up a pineapple; then, a squirrel is foraging?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "According to the arrangement of events in the video, does a person pick up a pineapple before a squirrel starts foraging?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a squirrel foraging before a person picks up a pineapple?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is a person picking up a pineapple and a squirrel foraging happening concurrently in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "According to the arrangement of events in the video, does a squirrel start foraging before a person picks up a pineapple?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1054717541_1047368344_0": { "order": [ { "question": "Are a person kneading dough and a girl jumping into water occurring at the same time in the video?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is a person kneading dough occurring after a girl jumping into water in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1054717541_1047368344_1": { "order": [ { "question": "Is the sequence of events in the video a person kneading dough followed by a girl jumping into water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the sequence of events in the video a girl jumping into water followed by a person kneading dough?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1054717541_1047368344_2": { "order": [ { "question": "Does the sequence of events in the video start with a girl jumping into water and then a person kneading dough?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the sequence of events in the video start with a person kneading dough and then a girl jumping into water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1089201973_1086820415_0": { "order": [ { "question": "Is a person kicking football shown at the same time as a big wave?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do a person kicking football and a big wave being shown happen together in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the first event shown in the video a person kicking football before by a big wave?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video a person kicks football and then a big wave is shown?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1089201973_1086820415_1": { "order": [ { "question": "Is a person kicking football shown before a big wave in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a person kicking football shown after a big wave in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1089201973_1086820415_2": { "order": [ { "question": "Is the order of events in the video that a big wave is shown and then a person is kicking football?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a person is kicking football and then a big wave is shown?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1080990179_1086820415_0": { "order": [ { "question": "Are an apple drying out and a big wave shown at the same time?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is it correct that an apple drying out and a big wave are shown simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is an apple drying out first and then a big wave is shown?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is a big wave shown first and then an apple is drying out?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1080990179_1086820415_1": { "order": [ { "question": "Is the order of events in the video that an apple is drying out first and then a big wave is shown?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a big wave is shown first and then an apple is drying out?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1080990179_1086820415_2": { "order": [ { "question": "Does the video show a big wave before an apple drying out?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does an apple drying out happen after a big wave is shown in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are both events (an apple drying out and a big wave shown) happening simultaneously in the video?", "gt-answer": "no", "video-llm-prediction": "No. The video shows a drying apple and a big wave in the ocean, but they are not happening simultaneously. The video shows the apple drying out in a dark room, while the big wave is shown in the ocean.", "match_success": true, "rating": 1 }, { "question": "Is a big wave shown later in the video compared to an apple drying out?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1067268403_1064645467_0": { "order": [ { "question": "Are a man doing exercise and wind turbines rotating concurrently in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video wind turbines rotating followed by a man doing exercise?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1067268403_1064645467_1": { "order": [ { "question": "Is the order of events in the video: Wind turbines are rotating followed by a man doing exercise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video: A man doing exercise followed by wind turbines rotating?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1067268403_1064645467_2": { "order": [ { "question": "Is the order of events in the video a man doing exercise followed by wind turbines rotating?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is wind turbines rotating followed by a man doing exercise, the order of events in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_0": { "order": [ { "question": "Does the video show that viruses dissolving and planet earth assembling from toy bricks happening simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the video show that viruses are dissolving and then planet earth is assembling from toy bricks?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_1": { "order": [ { "question": "Are the events in the video happening in the order of planet earth assembling from toy bricks and then viruses dissolving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the events in the video happening in the order of viruses dissolving and then planet earth assembling from toy bricks?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1082268005_1063373449_2": { "order": [ { "question": "Are the events in the video happening in the order of viruses dissolving and then planet earth assembling from toy bricks?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the events in the video happening in the order of planet earth assembling from toy bricks and then viruses dissolving?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_0": { "order": [ { "question": "Do the events happen simultaneously, with a light bulb lighting up while the tree is growing up?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a light bulb is lighting up and then the tree is growing up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_1": { "order": [ { "question": "Are the events in the video ordered as the tree growing up and then a light bulb lighting up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the tree growing up and then a light bulb lighting up the order of events in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a light bulb is lighting up and then the tree is growing up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is a light bulb lighting up and then the tree growing up the order of events in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1060403198_1049965795_2": { "order": [ { "question": "Is the order of events in the video that a light bulb is lighting up and then the tree is growing up?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a light bulb lighting up and then the tree growing up the order of events in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the events in the video ordered as the tree growing up and then a light bulb lighting up?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the tree growing up and then a light bulb lighting up the order of events in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1091143117_1094219575_0": { "order": [ { "question": "Does the opening of the eye happen simultaneously as the wilting of the flower?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the eye opening while at the same time the flower is wilting", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is an eye opening before a flower wilts?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is a flower wilting before an eye opens?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1091143117_1094219575_1": { "order": [ { "question": "Does the eye open first and then the flower wilts?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the opening of the eye happen before the wilting of the flower?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that the eye opens first and then the flower wilts?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the flower wilt first and then the eye opens?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Does the wilting of the flower happen before the opening of the eye?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video that the flower wilts first and then the eye opens?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1091143117_1094219575_2": { "order": [ { "question": "Is a flower wilting first and then an eye opening?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a flower wilt first before an eye opens?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the events in the video occurring in the order of a flower wilting first and then an eye opening?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is an eye opening first and then a flower wilting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does an eye open first before a flower wilts?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Do the events in the video occur in the order of an eye opening first and then a flower wilting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086105089_1085910917_0": { "order": [ { "question": "Does a woman drink water while a building is being constructed simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a building being constructed shown at the same time as a woman drinking water?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a building being constructed happen before a woman drinking water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does a building is being constructed comes first, followed by a woman drinking water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086105089_1085910917_1": { "order": [ { "question": "Does the building being constructed happen before a woman is drinking water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does a building being constructed come first, followed by a woman drinking water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is it true that the building being constructed happens before a woman is drinking water?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does a woman is drinking water happen before a building is being constructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does a woman is drinking water come first, followed by a building being constructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is it true that a woman is drinking water happens before a building is being constructed?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086105089_1085910917_2": { "order": [ { "question": "Does a woman drink water before a building is being constructed?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the event of a woman drinking water happen before the event of a building being constructed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a woman drinking water come before a building being constructed in sequence?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does a building being constructed come first before a woman drinking water?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the event of a building being constructed happen before the event of a woman drinking water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does a building being constructed come before a woman drinking water in sequence?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1034736653_1043054206_0": { "order": [ { "question": "Do car race and women run happen at the same time in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does cars race happen before women run in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1034736653_1043054206_1": { "order": [ { "question": "Do the events occur in the order of women running, then cars racing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the events occur in the order of cars racing, then women running?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1034736653_1043054206_2": { "order": [ { "question": "Do the events occur in the order of cars racing, then women running?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Do the events occur in the order of women running, then cars racing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_0": { "order": [ { "question": "Does the event of a dog giving a high five to a woman happen simultaneously with foods being added into a bowl in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the chronological order of events in the video that foods are added into a bowl, and then a dog is giving a high five to a woman?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_1": { "order": [ { "question": "Is the correct chronological order of events in the video that foods are added into a bowl, and then a dog gives a high five to a woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the correct chronological order of events in the video that a dog gives a high five to a woman, and then foods are added into a bowl?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1086423566_1094782389_2": { "order": [ { "question": "Is the correct chronological order of the events in the video: 'A dog is giving a high five to a woman, and then foods are added into a bowl'?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the correct chronological order of the events in the video: 'Foods are added into a bowl, and then a dog is giving a high five to a woman'?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1053758117_1055413730_0": { "order": [ { "question": "Are the digital brain spinning and the earth spinning happening together?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the digital brain spinning happening after the earth is spinning?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1053758117_1055413730_1": { "order": [ { "question": "Does the digital brain spin before the earth in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video: the digital brain spins and then the earth spins?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the earth spin before the digital brain in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video: the earth spins and then the digital brain spins?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1053758117_1055413730_2": { "order": [ { "question": "Does the earth spin before the digital brain in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video: the earth spins and then the digital brain spins?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the digital brain spin before the earth in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video: the digital brain spins and then the earth spins?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1076877854_1073914229_0": { "order": [ { "question": "Are robotic arms and trains shown at the same time in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is it true that robotic arms working and trains driving happen simultaneously in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the robotic arms working before trains start driving in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is it true that robotic arms working after trains driving in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1076877854_1073914229_1": { "order": [ { "question": "In the video, do the events occur with the robotic arms working first, and then the trains driving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the video, do the events occur with the trains driving first, and then the robotic arms working?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1076877854_1073914229_2": { "order": [ { "question": "In the video, do the events occur with the trains driving first, and then the robotic arms working?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "In the video, do the events occur with the robotic arms working first, and then the trains driving?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067268406_1067427023_0": { "order": [ { "question": "Is a white car driving while snow particles are melting simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a white car is driving while snow particles are melting simultaneously?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is a white car driving happens before snow particles are melting", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video that a white car is driving, then snow particles are melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067268406_1067427023_1": { "order": [ { "question": "Is the order of events in the video that a white car is driving, then snow particles are melting?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that snow particles are melting, then a white car is driving?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1067268406_1067427023_2": { "order": [ { "question": "Is the order of events in the video that snow particles are melting, then a white car is driving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that a white car is driving, then snow particles are melting?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1086286649": { "action": [ { "question": "Are the armored vehicles driving?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is driving the main action performed by the armored vehicles?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the armored vehicles loading people?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the armored vehicles firing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ], "direction": [ { "question": "Are the armored vehicles moving from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the armored vehicles approaching from the left side of the screen?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the armored vehicles proceeding from right to left?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the armored vehicles from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the armored vehicles approaching from the right side of the screen?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Are the armored vehicles proceeding from left to right?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "speed": [ { "question": "Are the armored vehicles moving slowly?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pace of the armored vehicles slow?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Would you describe the movement of the armored vehicles as slow?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the armored vehicles moving rapidly?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the pace of the armored vehicles fast?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Would you describe the movement of the armored vehicles as quickly?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093041749": { "action": [ { "question": "Can the dragon perform the action of breathing fire?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the dragon engage in the activity of breathing fire?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can the dragon perform the action of eating food?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the dragon engage in the activity of laying eggs?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Is the dragon landing from the sky and then breathing fire?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is landing from the sky and then breathing fire the order of events performed by the dragon?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the dragon breathing fire and then landing from the sky?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is breathing fire and then landing from the sky the order of events performed by the dragon?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1076180768": { "action": [ { "question": "Is the knight drawing sword from sheath?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the action of the knight about drawing sword from sheath?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is drawing sword from sheath what the knight is demonstrating?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the knight putting on armor?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the action of the knight about shooting an arrow?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is raising a shield what the knight is demonstrating?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3406661033": { "action": [ { "question": "Is the man propelling himself forward in a wheelchair?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is propelling himself forward in a wheelchair the action that the man is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man moving by propelling himself forward in a wheelchair?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man swimming?", "gt-answer": "no", "video-llm-prediction": "No, the man is not swimming. He is sitting at a table with a woman.", "match_success": true, "rating": 1 }, { "question": "Is running the action that the man is performing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man crawling?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Did the man propel himself forward in wheelchair and then hand the document to colleagues?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the man hand the document to colleagues and then propel himself forward in wheelchair?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "3406618583": { "action": [ { "question": "Is the woman performing freestyle dance?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in freestyle dance?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman demonstrating freestyle dance?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman performing hip-hop?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman engaged in ballet?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman demonstrating jazz dance?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the camera moving by panning up and down around the girl in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera movement in the video by panning up and down around the girl?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving around the girl in the video by panning up and down?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the camera moving by panning left and right around the girl in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the camera movement in the video by rotating clockwise around the girl?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera moving in the video by zooming in and out around the girl?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "3405120819": { "action": [ { "question": "Is the chef shaping dough?", "gt-answer": "yes", "video-llm-prediction": "Yes, the chef is seen shaping dough in the video.", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the chef about shaping dough?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is shaping dough an activity that the chef is engaging in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the chef cutting dough?", "gt-answer": "no", "video-llm-prediction": "Yes, the chef is cutting dough in the video.", "match_success": true, "rating": 0 }, { "question": "Is the action performed by the chef about mixing dough with water?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is baking dough the activity that the chef is engaging in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ], "order": [ { "question": "Does the chef perform shaping dough before smiling at the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the chef smiling at the camera before shaping dough?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "3405088753": { "action": [ { "question": "Is the woman buying bread in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is buying bread the action performed by the woman in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is buying bread the activity the woman is engaged in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman cooking soup in the video?", "gt-answer": "no", "video-llm-prediction": "No, the video does not show the woman cooking soup. It only shows the man and woman in the bakery.", "match_success": true, "rating": 1 }, { "question": "Is dancing the action performed by the woman in the video?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is painting the activity the woman is engaged in?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "order": [ { "question": "Is the salesman packing up the bread before saying something to the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the salesman saying something to the woman before packing up the bread?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3401191309": { "action": [ { "question": "Is the athletic man taking off the prosthetic running blade?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is taking off the prosthetic running blade the action that the athletic man is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the athletic man putting on the prosthetic running blade?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is repairing a prosthetic running blade the action that the athletic man is performing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "21218935": { "action": [ { "question": "Is the woman exercising?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in exercising?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is exercising the action that the woman is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman cooking?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not cooking. She is shown doing sit-ups and smiling at the camera.", "match_success": true, "rating": 1 }, { "question": "Is the woman dancing?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not dancing. She is seen doing sit-ups while sitting on a bench.", "match_success": true, "rating": 1 }, { "question": "Is the woman painting?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not painting. She is shown doing sit-ups and smiling at the camera.", "match_success": true, "rating": 1 } ], "order": [ { "question": "Is the woman doing push ups and then smiling at the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "In which order does the woman perform the actions, doing push ups and then smiling at the camera?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman smiling at the camera and then doing push ups?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "In which order does the woman perform the actions, smiling and then doing push ups?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "5395244": { "action": [ { "question": "Is the woman walking across the creek?", "gt-answer": "yes", "video-llm-prediction": "Yes, the woman is walking across the creek.", "match_success": true, "rating": 1 }, { "question": "Is the woman interacting with the creek by walking across it?", "gt-answer": "yes", "video-llm-prediction": "Yes. The woman is seen walking across the creek in the video.", "match_success": true, "rating": 1 }, { "question": "Is walking across the pebble creek the activity the woman is engaged in at the moment?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman swimming across the creek?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman canoeing across the creek?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is running across the pebble creek the activity the woman is engaged in at the moment?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1037628617": { "action": [ { "question": "Is the person clicking button and rolling wheel on a mouse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person's action about clicking button and rolling wheel on a mouse?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is clicking button and rolling wheel on a mouse what the person is doing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person pressing a keyboard key and rotating a jog dial?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the person tapping a touchpad and scrolling with two fingers?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is pressing a keyboard key and rotating a jog dial what the person is doing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1066801717": { "action": [ { "question": "Is the woman arranging bouquet of daffodils?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is arranging bouquet of daffodils the action performed by the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman cutting bouquet of daffodils?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not cutting the bouquet of daffodils. She is holding the vase and talking to the camera.", "match_success": true, "rating": 1 }, { "question": "Is watering bouquet of daffodils the action performed by the woman?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1088428381": { "action": [ { "question": "Is the woman opening a gift box in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes. The woman is seen opening a gift box in the video.", "match_success": true, "rating": 1 }, { "question": "Is the woman performing the action of opening a gift box?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Can the action of opening a gift box be observed from the woman in the video?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the woman storing items in a gift box in the video?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the woman delivering a gift box in the video?", "gt-answer": "no", "video-llm-prediction": "Yes. The woman is seen holding a gift box and giving it to someone.", "match_success": true, "rating": 0 }, { "question": "Is the woman wrapping a gift box in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1069593640": { "action": [ { "question": "Is the woman putting a towel on her neck?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is putting a towel on her neck the action being performed by the woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman drying hair with a towel?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is washing face with a towel the action being performed by the woman?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "8307961": { "order": [ { "question": "Is the man chatting with a woman while walking and then showing something on his tablet to a woman?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man walking and simultaneously showing something on his tablet to a woman?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "15439453": { "action": [ { "question": "Are they tango dancing and playing saxophone in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are tango dancing and playing saxophone the two actions depicted in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is a girl playing saxophone in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are they ballet dancing and playing saxophone in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are tango dancing and playing violin the two actions depicted in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is a boy playing saxophone in the video?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1107947873": { "action": [ { "question": "Is the doctor giving medicine to a patient?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is giving medicine to a patient the primary role of the doctor in the scene?", "gt-answer": "yes", "video-llm-prediction": "No. The doctor is also seen examining the patient's hand and giving them a piece of cake.", "match_success": true, "rating": 0 }, { "question": "Is giving medicine to a patient an activity seen in the video involving the doctor?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the doctor writing a prescription?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is checking vitals the primary role of the doctor in the scene?", "gt-answer": "no", "video-llm-prediction": "No. The doctor is also seen holding a cup of coffee and a piece of cake, as well as a cell phone.", "match_success": true, "rating": 1 }, { "question": "Is performing a surgery an activity seen in the video involving the doctor?", "gt-answer": "no", "video-llm-prediction": "No, the video does not show the doctor performing a surgery. The video only shows the doctor sitting at a table and talking to a woman.", "match_success": true, "rating": 1 } ] }, "1081194848": { "action": [ { "question": "Is the researcher teaching children how to dissect a frog?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people engaged in dissecting a frog?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the task that the researcher performing with the children about dissecting a frog?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the researcher teaching children how to cook a frog?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the people engaged in feeding a frog?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the task that the researcher performing with the children about catching a frog?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1091526823": { "action": [ { "question": "Is the hand turning over pages of a book?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the hand about turning over pages of a book?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is turning over pages of a book what the hand is doing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the hand opening a book?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the action performed by the hand about writing on a book?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is closing a book what the hand is doing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "26631100": { "order": [ { "question": "Are three hands holding the clay pot first and then two hands are holding the clay pot?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video that three hands are holding the clay pot first and then two hands are holding the clay pot?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are two hands holding the clay pot first and then three hands are holding the clay pot?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the order of events in the video that two hands are holding the clay pot first and then three hands are holding the clay pot?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1104663381": { "action": [ { "question": "Is the man stretching a pizza dough?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in stretching a pizza dough while being filmed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man cutting a pizza dough?", "gt-answer": "no", "video-llm-prediction": "No, the man is not cutting a pizza dough. He is making a ball of dough.", "match_success": true, "rating": 1 }, { "question": "Is the man folding a pizza dough?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ], "direction": [ { "question": "Is the pizza dough rotating counter-clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the pizza dough moving in the direction of rotating counter-clockwise?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the pizza dough rotating clockwise?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the pizza dough moving in the direction of flipping up and down?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "22100041": { "action": [ { "question": "Is the woman doing an invitation gesture?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman performing the action of doing an invitation gesture?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "When captured on video, is the woman engaged in doing an invitation gesture?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman waving goodbye?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the woman pointing towards something?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the woman clapping her hands?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1103623921": { "action": [ { "question": "Is the man playing pool?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in playing pool?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is playing pool the action the man is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man playing football?", "gt-answer": "no", "video-llm-prediction": "No, the man is playing pool.", "match_success": true, "rating": 1 }, { "question": "Is the man sleeping?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is reading books the action the man is performing?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ], "speed": [ { "question": "Is the speed that the video is playing normal speed?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Would you describe the speed at which the video is playing as normal?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "What playback rate is the video currently at - normal pace?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the speed that the video is playing slow-motion?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed that the video is playing fast-forward?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the speed that the video is playing stopped?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1093338031": { "action": [ { "question": "Is the man attempting to punch a computer screen?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is punching a computer screen the action that the man is trying to perform?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is attempting to punch a computer screen the man's activity in the video?", "gt-answer": "yes", "video-llm-prediction": "No.", "match_success": true, "rating": 0 }, { "question": "Is the man attempting to fix a computer screen?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is cleaning a computer screen the action that the man is trying to perform?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is attempting to click a computer screen the man's activity in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1064310466": { "action": [ { "question": "Is the man peeling cocoa seeds?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man involved in the activity of peeling cocoa seeds?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man watering cocoa seeds?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the man involved in the activity of baking cocoa seeds?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1088497853": { "direction": [ { "question": "Is the direction of the movement in the video upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the camera moving upwards before the stone building?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the trajectory of the camera movement in the video flying upwards?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the direction of the movement in the video downwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the camera moving rightwards before the stone building?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the trajectory of the camera movement in the video flying leftwards?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1106087175": { "action": [ { "question": "Is the man drawing on a white sneaker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in drawing on a white sneaker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Which action can be observed in the video: drawing on a white sneaker?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man taking off a white sneaker?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the man tying shoelaces on a white sneaker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the man wearing a white sneaker?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "13324343": { "order": [ { "question": "Does the man tie his shoelaces and then glide on the skateboard?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the sequence of actions, does the man tie his shoelaces and then glide on the skateboard?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is tying his shoelaces and then gliding on the skateboard the correct order of actions by the man?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does the man glide on the skateboard and then tie his shoelaces?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "In the sequence of actions, does the man glide on the skateboard and then tie his shoelaces?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is glide on the skateboard and then tying his shoelaces the correct order of actions by the man?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1083624811": { "action": [ { "question": "Is the woman performing alternating leg lift plank?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman carrying out the action of performing alternating leg lift plank?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in the activity of performing alternating leg lift plank?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman performing push-ups?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman carrying out the action of performing side plank variations?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the woman engaged in the activity of performing a traditional plank hold?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1014976360": { "order": [ { "question": "Does the man look at his phone and then taking off his glasses?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the man take off his glasses and then look at his phone?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "18416608": { "order": [ { "question": "Is the woman sampling water in a bottle first, then operating her tablet?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman operating her tablet first, then sampling water in a bottle?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1061351290": { "order": [ { "question": "Does the woman touch her pregnant belly before measuring her belly with a measuring tape?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the order of events in the video involving the woman about touching her pregnant belly and then measuring her belly with a measuring tape?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the woman perform the action of touching her pregnant belly before measuring her belly with a measuring tape?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the woman take off clothes after measuring her belly with a measuring tape?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the sequence of actions in the video involving the woman about measure her belly with a measuring tape and then touching her pregnant belly?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does the woman measure her belly with a measuring tape before touching her pregnant belly?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1066238617": { "action": [ { "question": "Is the woman practising her punches?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in practising her punches?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is practising her punches the action that the woman is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman dancing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman engaged in singing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is playing chess the action that the woman is performing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1072000366": { "action": [ { "question": "Are the girls elbowing each other?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the girls engaged in the action of elbowing each other?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the girls involved in the activity of elbowing each other?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the girls waving at each other?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Are the girls shaking hands?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the girls engaged in the action of giving high five to each other?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1065272113": { "action": [ { "question": "Is the doctor giving the woman an injection?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the action of the doctor on the woman about giving an injection?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is giving an injection the primary action of the doctor?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the doctor taking the woman's blood pressure?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the action of the doctor on the woman about writing a prescription?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is applying bandage the action the doctor is engaged in?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1072971926": { "action": [ { "question": "Is the man opening the pizza box?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the man about opening the pizza box?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is opening the pizza box what the man is doing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man eating the pizza?", "gt-answer": "no", "video-llm-prediction": "No, the man is not eating the pizza. He is holding it and looking at it.", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the man about closing the pizza box?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is wrapping the pizza box what the man is doing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "3399348431": { "action": [ { "question": "Is the person squeezing the sauce into a bowl of vegetables?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video showing the action of squeezing the sauce into a bowl of vegetables?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person mixing the sauce with the vegetables?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video showing the action of dipping vegetables on the sauce?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1025137214": { "action": [ { "question": "Is the man smoking a cigarette?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in smoking a cigarette?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is smoking a cigarette the activity the man is involved in?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man walking?", "gt-answer": "no", "video-llm-prediction": "No, the man is not walking. He is lying on the ground and smoking a cigarette.", "match_success": true, "rating": 1 }, { "question": "Is the man reading a book?", "gt-answer": "no", "video-llm-prediction": "No, the man is not reading a book. He is smoking a cigarette and looking at the city.", "match_success": true, "rating": 1 }, { "question": "Is playing soccer the activity the man is involved in?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1033101626": { "action": [ { "question": "Is the man playing an instrument?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in playing an instrument?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is playing an instrument the action that the man is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man cooking?", "gt-answer": "no", "video-llm-prediction": "No, the man is not cooking. He is playing a musical instrument.", "match_success": true, "rating": 1 }, { "question": "Is the man reading?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the man playing an instrument and dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "9537677": { "action": [ { "question": "Is the woman playing tablet?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman's action in the video about playing tablet?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is playing tablet the main focus of the woman's attention?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman reading a book?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not reading a book. She is using her phone to text and browse the internet.", "match_success": true, "rating": 1 }, { "question": "Is the woman dancing?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not dancing. She is sitting on a bench and looking at her phone.", "match_success": true, "rating": 1 }, { "question": "Is listening to music the main focus of the woman's attention?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1077388994": { "action": [ { "question": "Is the woman patting the baby?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in patting the baby?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is patting the baby what the woman is doing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman singing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the woman cooking dinner?", "gt-answer": "no", "video-llm-prediction": "No, the woman is not cooking dinner. She is holding a baby in her arms and smiling at the camera.", "match_success": true, "rating": 1 }, { "question": "Is writing a letter what the woman is doing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1037531786": { "action": [ { "question": "Are the two men boxing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is boxing the physical activity that the two men are engaged in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the two men participating in boxing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the two men dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is swimming the physical activity that the two men are engaged in?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is basketball the sport that the two men are participating in?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1077275024": { "action": [ { "question": "Is the girl clapping hands for a man playing ukulele?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the girl engaged in clapping hands for a man playing ukulele?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is clapping hands for a man playing ukulele the action the girl is performing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the girl jumping with a man playing ukulele?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the girl dancing with a man playing ukulele?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the girl recording the man playing the ukulele?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1107180099": { "action": [ { "question": "Are the women dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the women engaged in dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does dancing describe the primary action of the group of women?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the women singing?", "gt-answer": "no", "video-llm-prediction": "No, the women are not singing. They are performing a dance routine on a basketball court.", "match_success": true, "rating": 1 }, { "question": "Are the women painting?", "gt-answer": "no", "video-llm-prediction": "No, the women are not painting. They are performing a dance routine on a basketball court.", "match_success": true, "rating": 1 }, { "question": "Are the women cooking?", "gt-answer": "no", "video-llm-prediction": "No, the women are not cooking. They are performing a dance routine on a basketball court.", "match_success": true, "rating": 1 } ] }, "1049434159": { "action": [ { "question": "Are the parents and daughter playing video games?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the parents and daughter engaged in playing video games?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Do the parents and daughter participate in a activity of playing video games?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the parents and daughter cooking dinner?", "gt-answer": "no", "video-llm-prediction": "No, the video shows the family playing video games together.", "match_success": true, "rating": 1 }, { "question": "Are the parents and daughter hiking?", "gt-answer": "no", "video-llm-prediction": "No, the video does not show the family hiking. It only shows them playing video games together.", "match_success": true, "rating": 1 }, { "question": "Are the parents and daughter involved in dancing?", "gt-answer": "no", "video-llm-prediction": "Yes. The parents and daughter are seen dancing together in the video.", "match_success": true, "rating": 0 } ] }, "3402234027": { "action": [ { "question": "Is the cat eating food?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the cat engaged in the activity of eating food?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the cat performing the action of eating food on the ground?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the cat sleeping?", "gt-answer": "no", "video-llm-prediction": "No, the cat is not sleeping. It is eating the food on the ground.", "match_success": true, "rating": 1 }, { "question": "Is the cat playing with a toy?", "gt-answer": "no", "video-llm-prediction": "No, the cat is not playing with a toy. It is eating food from the ground.", "match_success": true, "rating": 1 }, { "question": "Is the cat climbing a tree?", "gt-answer": "no", "video-llm-prediction": "No, the cat is not climbing a tree. The video shows the cat eating cat food on the ground.", "match_success": true, "rating": 1 } ] }, "1056491306": { "action": [ { "question": "Are the passengers taking a seat on the subway?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is taking a seat what the passengers are doing on the subway?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the passengers performing the action of taking a seat inside the subway?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Are the passengers sleeping on the bed?", "gt-answer": "no", "video-llm-prediction": "No, the passengers are not sleeping on the bed. They are sitting on the bed and looking at their phones.", "match_success": true, "rating": 1 }, { "question": "Are the passengers standing in a room?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Are the passengers dancing on the stage?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1012085909": { "action": [ { "question": "Are the people pushing bikes up a hill?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people moving by pushing bikes?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is pushing bikes the main activity of the people?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Are the people rolling boats on the lake?", "gt-answer": "no", "video-llm-prediction": "No, the people are not rolling boats on the lake. They are riding bikes on a dirt road.", "match_success": true, "rating": 1 }, { "question": "Are the people walking on the street?", "gt-answer": "no", "video-llm-prediction": "No, the people are not walking on the street. They are riding bicycles on a dirt road.", "match_success": true, "rating": 1 }, { "question": "Are the people swimming?", "gt-answer": "no", "video-llm-prediction": "No, the people are not swimming. They are riding bikes on a dirt road.", "match_success": true, "rating": 1 } ] }, "1079406734": { "action": [ { "question": "Is the man washing the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in washing the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is washing the car the activity the man is engaged in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man riding bikes?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is the man feeding a dog?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 }, { "question": "Is dancing the activity the man is engaged in?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1022115337": { "order": [ { "question": "Is the video showing dancing and then sending an air kiss?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Does dancing occur before sending an air kiss?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does sending an air kiss occur after dancing?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the video showing sending an air kiss and then dancing?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Does sending an air kiss occur before dancing?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does dancing occur after sending an air kiss?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1071214909": { "action": [ { "question": "Is the person drawing a cutting line?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the action performed by the person about drawing a cutting line on a wood surface?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the video about drawing a cutting line on a wood surface?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person carving a design?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the action performed by the person about erasing a line on a wood surface?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the video about measuring length on a wood surface?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1092065543": { "action": [ { "question": "Is the man shopping?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man engaged in the activity of shopping?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "In the video, can we see the man shopping?", "gt-answer": "yes", "video-llm-prediction": "Yes, we can see the man shopping in the video.", "match_success": true, "rating": 1 }, { "question": "Is the man eating?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the man gardening?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "In the video, can we see the man dancing?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 } ] }, "1017063703": { "action": [ { "question": "Is the person decorating cakes in the video?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the action demonstrated in the video about decorating cakes?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is decorating cakes the task being performed in the footage?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the person baking cakes in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is cutting cakes the task being performed in the footage?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is presenting cakes to guests the action demonstrated in the video?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1055022287": { "action": [ { "question": "Is the man cleaning a swimming pool?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is cleaning a swimming pool the activity being performed by the man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is cleaning a swimming pool the action that the man is undertaking?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man cooking?", "gt-answer": "no", "video-llm-prediction": "No, the man is not cooking. He is cleaning a pool with a hose.", "match_success": true, "rating": 1 }, { "question": "Is playing basketball the activity being performed by the man?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is reading the action that the man is undertaking?", "gt-answer": "no", "video-llm-prediction": "No", "match_success": true, "rating": 1 } ] }, "1094259081": { "action": [ { "question": "Is the woman playing VR shooting game?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the woman engaged in playing VR shooting game?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is playing VR shooting game the activity the woman is participating in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the woman watching VR movie?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman listening to music using VR?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the woman working out using VR?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1022260408": { "action": [ { "question": "Is the squirrel eating food?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the squirrel about eating food?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is eating food one of the actions performed by the squirrel?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the squirrel sleeping?", "gt-answer": "no", "video-llm-prediction": "No.", "match_success": true, "rating": 1 }, { "question": "Is the activity of the squirrel about chasing its tail?", "gt-answer": "no", "video-llm-prediction": "No, the squirrel is not chasing its tail. It is eating something from a tree.", "match_success": true, "rating": 1 }, { "question": "Is climbing a tree one of the actions performed by the squirrel?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1089810969": { "action": [ { "question": "Does the little girl run towards the woman and hug her?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the little girl running towards a woman and hugging her?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the action of running towards a woman and hugging her performed by the little girl?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the little girl walk towards the woman and hug her?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the little girl jumping on the woman's back?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Does the little girl run towards the woman and talk to her?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "6165731": { "action": [ { "question": "Is the scientist looking confused and frustrated about the experiment?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the scientist feel confused and frustrated about the experiment?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the emotional state of the scientist during the experiment confused and frustrated?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the scientist observing quietly on the experiment?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the scientist leisurely conducting experiments?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is the scientist bored and disinterested about the experiment?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "1111469465": { "action": [ { "question": "Is the man raising his arm to look at the watch looking anxious?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is the man's action about raising his arm to look at the watch looking anxious?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Does the video show the man raising his arm to look at the watch looking anxious?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the man raising his arm to look at the watch looking happy?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the man raising his arm to look at the watch looking calm?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the man putting his hands in his pockets looking anxious?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 } ] }, "1050000214": { "action": [ { "question": "Is the little child water jumping?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the little child performing the action of water jumping?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Is water jumping the action that the little child is engaged in?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is the little child running?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 }, { "question": "Is the little child eating?", "gt-answer": "no", "video-llm-prediction": "No, the little child is not eating. He is playing in the water and splashing around.", "match_success": true, "rating": 1 }, { "question": "Is the little child swimming?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] }, "27537016": { "order": [ { "question": "Did the man show off his car key and then pull back inside the car?", "gt-answer": "yes", "video-llm-prediction": "Yes.", "match_success": true, "rating": 1 }, { "question": "Was showing off his car key followed by pulling back inside the car?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Is showing off his car key and then pulling back inside the car the correct sequence of events involving the man?", "gt-answer": "yes", "video-llm-prediction": "Yes", "match_success": true, "rating": 1 }, { "question": "Did the man pull back inside the car and then show off his car key?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Was pulling back inside the car followed by showing off his car key?", "gt-answer": "no", "video-llm-prediction": "Yes", "match_success": true, "rating": 0 }, { "question": "Is throwing away his car key and then pulling back inside the car the correct sequence of events involving the man?", "gt-answer": "no", "video-llm-prediction": "Yes.", "match_success": true, "rating": 0 } ] } } }