{
"v2_0": {
"question": "What is x in the equation?v2_0_0.png",
"answer": "-1-5",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_1": {
"question": "What is d in the last equation?v2_1_0.png",
"answer": "1.25=1.255/4",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_2": {
"question": "What is x in the equation?v2_1_0.png",
"answer": "0.75=0.753/4",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_3": {
"question": "What is the answer to the bottom left equation?v2_3_0.png",
"answer": "12=12",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_4": {
"question": "What is the answer to the second equation on the right?v2_3_0.png",
"answer": "7=7",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_5": {
"question": "What is the answer to the second last equation on the right?v2_5_0.png",
"answer": "2=2",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_6": {
"question": "What is y in the last equation?v2_5_0.png",
"answer": "5=5",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_7": {
"question": "Find the pattern of how the \"X\" operator is redefined, and answer the given equation in the image.v2_7_0.png",
"answer": "13=13",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_8": {
"question": "What will the girl on the right write on the board?v2_8_0.png",
"answer": "14=14",
"capability": [
"rec",
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_9": {
"question": "How many gallons of supreme gasoline can I get with $50?v2_9_0.png",
"answer": "13.613.7",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_10": {
"question": "What is the price difference between diesel and regular gasoline?v2_9_0.png",
"answer": "0.11",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_11": {
"question": "What is the total price for a bottle of Merlot and a bottle of Cabernet shown in the image?v2_11_0.jpg",
"answer": "249.98",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_12": {
"question": "What is the cost of three bottles of Moet champagne?v2_11_0.jpg",
"answer": "344.97",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_13": {
"question": "I am getting one funghi pizza and one prosciutto pizza. How much should I pay in total?v2_13_0.jpg",
"answer": "14.814,8",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_14": {
"question": "I am getting two margherita pizza and one calzone. How much should I pay in total?v2_13_0.jpg",
"answer": "25.825,8",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_15": {
"question": "What is the original price for pork belly before discount?v2_15_0.png",
"answer": "14",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_16": {
"question": "What is the gasoline price?v2_16_0.jpg",
"answer": "4.2994.3",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_17": {
"question": "What is the color of the hat worn by the person in the front left?v2_17_0.jpg",
"answer": "blue",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_18": {
"question": "What is located to the right of the shampoo?v2_18_0.jpg",
"answer": "conditioner",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_19": {
"question": "What is in the right most bottle?v2_18_0.jpg",
"answer": "mousse",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_20": {
"question": "What is the spatial relation between the frisbee and the man?v2_20_0.jpg",
"answer": "above the mantop left",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_21": {
"question": "Which car is on the parking spot 33?v2_21_0.jpg",
"answer": "noempty",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_22": {
"question": "Which spot is the red car parking on?v2_21_0.jpg",
"answer": "31",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_23": {
"question": "What is the price for tomatoes?v2_23_0.png",
"answer": "eight8.0",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_24": {
"question": "What fruit is the the right of plums?v2_23_0.png",
"answer": "orange",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_25": {
"question": "Based on the image, what is the total international awareness of Tina Fey?v2_25_0.png",
"answer": "35%",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_26": {
"question": "Based on the image, in which country does Tina Fey have the highest level of total awareness?v2_25_0.png",
"answer": "Australia",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_27": {
"question": "What earth's interior structure does number 2 indicate?v2_27_0.png",
"answer": "mantle",
"capability": [
"ocr",
"know",
"spat"
],
"added_in": "v1"
},
"v2_28": {
"question": "What is the number displayed on the motorcycle ridden by the motorcyclist wearing a yellow suit?v2_28_0.jpg",
"answer": "16",
"capability": [
"rec",
"ocr"
],
"added_in": "v1"
},
"v2_29": {
"question": "What is the number displayed on the motorcycle on the right?v2_28_0.jpg",
"answer": "4",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_30": {
"question": "Are which one of these two jets are larger in size?v2_30_0.jpg",
"answer": "same",
"capability": [
"rec",
"know",
"spat"
],
"added_in": "v1"
},
"v2_31": {
"question": "Is the person bigger than the car?v2_31_0.png",
"answer": "no",
"capability": [
"rec",
"know",
"spat"
],
"added_in": "v1"
},
"v2_32": {
"question": "What should I do after kneading the dough, before dividing it into pieces?v2_32_0.png",
"answer": "warm place1 hour",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_33": {
"question": "Should I add sugar when mixing egg and milk?v2_33_0.png",
"answer": "no",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_34": {
"question": "What should I do before cutting herbs, sausage, and mushrooms?v2_34_0.jpg",
"answer": "tilt pan slightly",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_35": {
"question": "What is the index of the step when we need to add all purpose flour?v2_35_0.png",
"answer": "third 3",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_36": {
"question": "What should we add in the third step?v2_36_0.jpg",
"answer": "milk",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_37": {
"question": "What should kids do after snap fingers?v2_37_0.jpg",
"answer": "hop on one foot",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_38": {
"question": "What should be drawn in the fourth step?v2_38_0.jpg",
"answer": "nose",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_39": {
"question": "What is the step after using probe to spread tire puncture?v2_39_0.jpg",
"answer": "remove the repair",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_40": {
"question": "What is the second step suggested?v2_40_0.png",
"answer": "identify your audience",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_41": {
"question": "What is the last strategy given in the image?v2_41_0.png",
"answer": "make a song",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_42": {
"question": "What is the average total fueling cost excluding the Ford F150?v2_42_0.png",
"answer": "76.5576.56",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_43": {
"question": "What is the highest fueling cost?v2_42_0.png",
"answer": "130.96",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_44": {
"question": "Which category did the worst job in plastic recycling, considering the amount of plastic made and thrown out?v2_44_0.png",
"answer": "packaging",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_45": {
"question": "What is the difference in metric tonnes between the amount of plastic produced and the amount discarded?v2_44_0.png",
"answer": "105",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_46": {
"question": "What is the estimated average standing charge for the year 2023?v2_46_0.png",
"answer": "271",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_47": {
"question": "What is the estimated total cost for the year 2023?v2_46_0.png",
"answer": "23800",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_48": {
"question": "In which direction does the living room window face?v2_48_0.jpg",
"answer": "north",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_49": {
"question": "What are the appliances in the kitchen in this floorplan?v2_49_0.jpg",
"answer": "ovendishwasher",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_50": {
"question": "Which room is bigger, the double garage or the living room?v2_50_0.jpg",
"answer": "double garage",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_51": {
"question": "Which room is bigger, the master bedroom or the patio?v2_50_0.jpg",
"answer": "master bedroom",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_52": {
"question": "What is the solution if the lamp is plugged in and the bulb has burned out?v2_52_0.png",
"answer": "replace blub",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_53": {
"question": "Which step in the flowchart is drawn with a diamond shape?v2_53_0.png",
"answer": "water boiled?",
"capability": [
"rec",
"ocr"
],
"added_in": "v1"
},
"v2_54": {
"question": "What is the average wait time to climb out of bed?v2_54_0.png",
"answer": "15 min",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_55": {
"question": "Which year has the highest growth rate of median house price?v2_55_0.png",
"answer": "2008",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_56": {
"question": "What is Japan's gdp in 2012?v2_56_0.png",
"answer": "6,233.15 billion U.S. dollars",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_57": {
"question": "In which years did rowing and athletics have the same number of gold medals?v2_57_0.jpg",
"answer": "20002012",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_58": {
"question": "Which department is the person who has the highest salary from?v2_58_0.png",
"answer": "Administration",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_59": {
"question": "Based on the table, how much is Wilkins earning?v2_58_0.png",
"answer": "25002,500",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_60": {
"question": "Which country has a below-average profit margin?v2_60_0.png",
"answer": "India",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_61": {
"question": "Which country has the highest profit margin?v2_60_0.png",
"answer": "Australia",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_62": {
"question": "In which month is the highest income generated?v2_62_0.png",
"answer": "Feb",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_63": {
"question": "What percentage does salary contribute to total income?v2_62_0.png",
"answer": "56.20.562",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v1"
},
"v2_64": {
"question": "Who is the person on the left?v2_64_0.png",
"answer": "Keira Knightley",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_65": {
"question": "Who is the person in the image?v2_65_0.png",
"answer": "Michelle Yeoh",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_66": {
"question": "Who is the person in the bottom right?v2_66_0.jpg",
"answer": "Jamie Dornan",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_67": {
"question": "Which one is unsweetened?v2_67_0.png",
"answer": "oat",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_68": {
"question": "Is this apple organic?v2_68_0.png",
"answer": "yes",
"capability": [
"rec",
"ocr"
],
"added_in": "v1"
},
"v2_69": {
"question": "What is the calories for the entire bag?v2_69_0.jpg",
"answer": "275",
"capability": [
"ocr",
"math"
],
"added_in": "v1"
},
"v2_70": {
"question": "What is the name of this dish?v2_70_0.png",
"answer": "mapo tofu",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_71": {
"question": "What is the name of this dish?v2_71_0.jpg",
"answer": "Caprese Salad",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_72": {
"question": "What is the name of this dish?v2_72_0.png",
"answer": "pad thai",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_73": {
"question": "What is the make of the car on the left?v2_73_0.jpg",
"answer": "volkswagen",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_74": {
"question": "What does this factory make?v2_74_0.jpg",
"answer": "camera",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_75": {
"question": "what is the green logo on the car?v2_75_0.jpg",
"answer": "monster",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_76": {
"question": "What is the name of this landmark?v2_76_0.png",
"answer": "Trevi Fountain",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_77": {
"question": "What is the name of this landmark?v2_77_0.jpg",
"answer": "Anbariya Mosque",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_78": {
"question": "What is the name of this landmark?v2_78_0.jpg",
"answer": "baochu pagoda",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_79": {
"question": "What is the face value of this banknote?v2_79_0.jpg",
"answer": "five 5",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_80": {
"question": "What is this banknote?v2_80_0.jpg",
"answer": "ten pound10 poundBritish pound",
"capability": [
"rec",
"ocr"
],
"added_in": "v1"
},
"v2_81": {
"question": "What type of currency does this banknote represent?v2_81_0.jpg",
"answer": "SwedeKronor",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_82": {
"question": "Which chest xray disease can be found? (Options include: Atelectasis; Cardiomegaly; Effusion; Infiltration; Mass; Nodule; Pneumonia; Pneumothorax; Consolidation; Edema; Emphysema; Fibrosis; Pleural Thickening; Hernia.)v2_82_0.png",
"answer": "Cardiomegaly",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_83": {
"question": "Which chest xray disease can be found? (Options include: Atelectasis; Cardiomegaly; Effusion; Infiltration; Mass; Nodule; Pneumonia; Pneumothorax; Consolidation; Edema; Emphysema; Fibrosis; Pleural Thickening; Hernia.)v2_83_0.png",
"answer": "Hernia",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_84": {
"question": "Which chest xray disease can be found? (Options include: Atelectasis; Cardiomegaly; Effusion; Infiltration; Mass; Nodule; Pneumonia; Pneumothorax; Consolidation; Edema; Emphysema; Fibrosis; Pleural Thickening; Hernia.)v2_84_0.png",
"answer": "Infiltration",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_85": {
"question": "How many birds are there?v2_85_0.jpg",
"answer": "6",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_86": {
"question": "How many tomatoes are there?v2_86_0.jpg",
"answer": "5",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_87": {
"question": "How many books are there?v2_87_0.jpg",
"answer": "63",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_88": {
"question": "What are all the scene text in the image?v2_88_0.jpg",
"answer": "S3302CD",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_89": {
"question": "What are all the scene text in the image?v2_89_0.jpg",
"answer": "Luxmi Jewellers",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_90": {
"question": "What are all the scene text in the image?v2_90_0.jpg",
"answer": "have yourself a merry little Christmas",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_91": {
"question": "What are all the scene text in the image?v2_91_0.jpg",
"answer": "5:30PM88%Mario Kart 8 DeluxeMARIO KART 8 DELUXESUPER MARIO ODYSSEYTHE LEGEND OF ZELDABREATH OF WILDOptionsStart",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_92": {
"question": "What are all the scene text in the image?v2_92_0.jpg",
"answer": "MR. WILLIAM SHAKESPEARESCOMEDIES, HISTORIES, & TRAGEDIES.publifhed according to the True Originall Copies.",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_93": {
"question": "What are all the scene text in the image?v2_93_0.jpg",
"answer": "Connecticut law of 1642If any man or woman be a witch -- that is, hath or consulteth with a familiar spirit -- they shall be put to death",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_94": {
"question": "What is the brand of this device?v2_94_0.jpg",
"answer": "MOTOROLA",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_95": {
"question": "What is the license plate number?v2_95_0.jpg",
"answer": "AED-632",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_96": {
"question": "What are all the French scene text in the image?v2_96_0.jpg",
"answer": "HISTOIRE DE FRANCEDe La pr\u00e9histoire \u00e0 ans joursQueelle Histoire",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_97": {
"question": "What are all the Chinese scene text in the image?v2_97_0.jpg",
"answer": "\u9a6c\u66f3\u8457\u6bcf\u4e2a\u4eba\u90fd\u6709\u81ea\u5df1\u7684\u56f0\u5883\u4f46\u603b\u4f1a\u88ab\u5149\u4eae\u5438\u5f15\u8eab\u4e0d\u7531\u5df1\u5730\u6162\u6162\u9760\u8fd1",
"capability": [
"ocr"
],
"added_in": "v1"
},
"v2_98": {
"question": "Which continent is highlighted?v2_98_0.jpg",
"answer": "Asia",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_99": {
"question": "Which are producers in this food web?v2_99_0.png",
"answer": "PhytoplanktonSeaweed",
"capability": [
"ocr",
"know",
"spat"
],
"added_in": "v1"
},
"v2_100": {
"question": "Compare the average kinetic energies of the particles in each sample. The diagrams below show two pure samples of gas in identical closed, rigid containers. Each colored ball represents one gas particle. Both samples have the same number of particles. Which sample has the higher temperature? Sample A or sample B?v2_100_0.png",
"answer": "sample A",
"capability": [
"ocr",
"know",
"spat"
],
"added_in": "v1"
},
"v2_101": {
"question": "Which of these highlighted cities is the farthest north?v2_101_0.png",
"answer": "CHICAGO",
"capability": [
"ocr",
"spat"
],
"added_in": "v1"
},
"v2_102": {
"question": "Where is this photo taken?v2_102_0.png",
"answer": "turkeysyria",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_103": {
"question": "Where is this photo taken?v2_103_0.png",
"answer": "oscar2023",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_104": {
"question": "Where is this photo taken?v2_104_0.png",
"answer": "qatar",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_105": {
"question": "In which country was this photo taken?v2_105_0.png",
"answer": "australia",
"capability": [
"rec",
"know"
],
"added_in": "v1"
},
"v2_106": {
"question": "Are the trees taller than the giraffes?v2_106_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_107": {
"question": "Is this airplane taking off or landing?v2_107_0.jpg",
"answer": "taking off",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_108": {
"question": "How many people are sitting down?v2_108_0.jpg",
"answer": "one",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_109": {
"question": "Is the trash empty or full?v2_109_0.jpg",
"answer": "empty",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_110": {
"question": "Does the giraffe appear dangerous?v2_110_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_111": {
"question": "Is there any reflection of zebra in water?v2_111_0.jpg",
"answer": "yes",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_112": {
"question": "Is the man happy?v2_112_0.jpg",
"answer": "yes",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_113": {
"question": "Are all of the cats the same color?v2_113_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_114": {
"question": "Is that wine in the background?v2_114_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_115": {
"question": "Is the man going to fall down?v2_115_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_116": {
"question": "What place is pictured?v2_116_0.jpg",
"answer": "shore",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_117": {
"question": "Is it outdoors?v2_117_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_118": {
"question": "How's the weather?v2_118_0.jpg",
"answer": "clearsunny",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_119": {
"question": "What is the color of the fence made of metal?v2_119_0.jpg",
"answer": "green",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_120": {
"question": "Does the person to the left of the man appear to be sitting?v2_120_0.jpg",
"answer": "yes",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_121": {
"question": "Is the plate of the table both dirty and silver?v2_121_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_122": {
"question": "Is the curtain on the right side or on the left of the picture?v2_122_0.jpg",
"answer": "left",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_123": {
"question": "Is there a computer in this photo?v2_123_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_124": {
"question": "Are there napkins under the utensil to the left of the rice?v2_124_0.jpg",
"answer": "yes",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_125": {
"question": "Are there nuts or vegetables?v2_125_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_126": {
"question": "Are there both plates and forks in this picture?v2_126_0.jpg",
"answer": "yes",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_127": {
"question": "What is this bird called?v2_127_0.jpg",
"answer": "parrotconure",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_128": {
"question": "Which animal in the picture is larger, the cat or the dog?v2_128_0.jpg",
"answer": "cat",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_129": {
"question": "On the right desk, what is to the left of the laptop? v2_129_0.jpg",
"answer": "table lampdesk lamp",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_130": {
"question": "Does the man ride a horse?v2_130_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_131": {
"question": "Is the surfer to the left or to the right of the surfboard?v2_131_0.jpg",
"answer": "left",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_132": {
"question": "What is the lamp on, a side table or a nightstand?v2_132_0.jpg",
"answer": "side table",
"capability": [
"rec",
"spat"
],
"added_in": "v1"
},
"v2_133": {
"question": "What do both the stump and the fence have in common?v2_133_0.jpg",
"answer": "material",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_134": {
"question": "Is the spoon made of the same material as the chopsticks?v2_134_0.jpg",
"answer": "yes",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_135": {
"question": "Does the shirt have a different color than the kite?v2_135_0.jpg",
"answer": "yes",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_136": {
"question": "Do all these people have the same gender?v2_136_0.jpg",
"answer": "no",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_137": {
"question": "Are these two animals different species?v2_137_0.jpg",
"answer": "yes",
"capability": [
"rec"
],
"added_in": "v1"
},
"v2_138": {
"question": "Where are the persons? Answer it and give the rationale.v2_138_0.jpg",
"answer": "They are in a college classroom. I think so because he young woman appears to be college age, and they are surrounded by desks and chairs.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_139": {
"question": "Why are the persons wearing black clothes? Answer it and give the rationale.v2_139_0.jpg",
"answer": "They are going to a funeral. I think so because it is traditional for people to wear black to a funeral.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_140": {
"question": "Why is the woman wearing a robe? Answer it and give the rationale.v2_140_0.jpg",
"answer": "She is getting ready for bed. I think so because The room appears to be a bedroom and the woman is headed in the general direction of her bed.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_141": {
"question": "Where is this happening? Answer it and give the rationale.v2_141_0.jpg",
"answer": "This is happening in a fancy restaurant. I think so because the man is dressed fancily and the background is fancy.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_142": {
"question": "Is it summertime in the scene? Answer it and give the rationale.v2_142_0.jpg",
"answer": "No, it looks to be fall. I thinks so because there are pumpkins in the background and they are normally associated with fall.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_143": {
"question": "Is the woman in red going to be mad at the man, for looking at the woman in dress? Answer it and give the rationale.v2_143_0.jpg",
"answer": "Yes, the woman in red and the man appear to be a couple and the woman in red would not appreciate the man checking out other women.I think so because in a monogamous relationship, partners are expected to be faithful to one another.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_144": {
"question": "Why does the woman have both of her hands in the air? Answer it and give the rationale.v2_144_0.jpg",
"answer": "She just shot a basketball. I think so because Her arms are angled for a basketball shot and they are in a basketball arena.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_145": {
"question": "What kind of school does the boy go to? Answer it and give the rationale.v2_145_0.jpg",
"answer": "The boy goes to a private school, not a public school. I think so because the boy is all dressed up in a suit, public schools don't require that but some private schools do.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_146": {
"question": "Do the persons live in this house? Answer it and give the rationale.v2_146_0.jpg",
"answer": "No they do not. I think so because they are all looking around at the paintings and decorations, which one would not do if they were used to seeing them.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_147": {
"question": "Why are the man and woman in white so close to each other? Answer it and give the rationale.v2_147_0.jpg",
"answer": "They just got married. I think so because they're in wedding clothing and everyone is looking at them.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_148": {
"question": "Can you explain this meme?v2_148_0.jpg",
"answer": "This meme is a humorous take on procrastination and the tendency to delay tasks until a specific time. The person in the meme plans to do something at 8 o'clock, but when they miss that deadline by a few minutes, they decide to wait until 9 o'clock instead. The image of Kermit the Frog lying in bed represents the person's laziness and lack of motivation to complete the task.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_149": {
"question": "Can you explain this meme?v2_149_0.jpg",
"answer": "This meme is a commentary on the current situation of online learning due to the COVID-19 pandemic. It shows how different parties are affected by it.\n\nThe first two images show the Zoom company and the teachers throwing money in the air, which implies that they are profiting from the situation. Zoom, in particular, has seen a surge in usage and revenue due to the pandemic.\n\nThe third image shows the WiFi company also throwing money in the air, which implies that they are also profiting from the situation as more people are using the internet for online learning.\n\nThe last image shows a student with a sad clown face, which implies that students are not benefiting from the situation and are struggling with online learning. The \"Put on a happy face\" sign in the background further emphasizes the idea that students are putting on a brave face despite their struggles.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_150": {
"question": "Can you explain this meme?v2_150_0.jpg",
"answer": "This meme is poking fun at the fact that the names of the countries Iceland and Greenland are misleading. Despite its name, Iceland is known for its beautiful green landscapes, while Greenland is mostly covered in ice and snow. The meme is saying that the person has trust issues because the names of these countries do not accurately represent their landscapes.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_151": {
"question": "Can you explain this meme?v2_151_0.jpg",
"answer": "This meme is poking fun at how a student's handwriting deteriorates during an exam. The first two pages show neat and legible handwriting, the middle page shows slightly messier handwriting, and the last two pages show completely illegible scribbles. This is likely due to the student becoming tired or rushed as the exam progresses.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_152": {
"question": "Can you explain this meme?v2_152_0.jpg",
"answer": "This meme is a joke about how new college students (freshmen) are often eager to take notes and learn everything they can in class. The image is from the cartoon SpongeBob SquarePants, where SpongeBob and Patrick are frantically writing down notes. The caption implies that the freshmen are so eager to learn that they are even writing down the professor's greeting.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_153": {
"question": "What is funny about this image?v2_153_0.jpg",
"answer": "It is a cartoon of a rhinoceros painting a picture and each picture has its rhino horn because the rhino horn grows in front of its eyes. The caption \"You see the world as you are!\" is a playful commentary on how our perspective shapes our perception of the world.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_154": {
"question": "What is funny about this image?v2_154_0.png",
"answer": "There are a few things that people might find funny about this image:\n\n1. The contrast between the two images: On the left, we see two women who are very emotional and angry, while on the right, we see a cat who is calmly sitting at a dinner table.\n\n2. The absurdity of the cat's situation: It is not common to see a cat sitting at a dinner table with a plate of food in front of it, so this image is unexpected and ridiculous.\n\n3. The cat's expression: The cat appears to be frightened by the women's yelling, which adds to the humor of the image.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_155": {
"question": "What occasions would someone use this meme?v2_155_0.png",
"answer": "The meme with the sleepy man and the Chinese caption \"\u9664\u4e86\u7761\u89c9\u65f6\u95f4\u4e0d\u60f3\u7761\u89c9\u5176\u4ed6\u65f6\u95f4\u90fd\u60f3\u7761\u89c9\" (Except during sleep time, I don't want to sleep. But during other times, I want to sleep) can be used in various occasions where the theme of feeling sleepy or having conflicting desires is relevant. Here are a few scenarios where this meme could be fitting:\n\n Relatable sleepiness: The meme can be shared on social media or in conversations when expressing the relatable feeling of being tired or sleepy during the day. It can serve as a lighthearted way to convey that relatable experience and generate a humorous response from others who can relate.\n\n Work or study-related humor: This meme can be used in work or study-related contexts to humorously express the desire to sleep or feeling drowsy during tasks that require attentiveness and focus. It can be shared among colleagues or classmates to lighten the mood and create a shared understanding of the challenges of staying awake and alert.\n\n Procrastination humor: The meme can also be used to depict the internal struggle between wanting to sleep or rest instead of engaging in productive activities. It can be shared when discussing procrastination or humorous self-reflections on the constant desire to avoid responsibilities and indulge in relaxation.\n\n Comedic irony: The meme's contradiction between sleep time and wanting to sleep at other times can be used as a form of comedic irony in various contexts. It can be shared when discussing situations where our desires or behaviors contradict what is expected or appropriate, adding a humorous twist to the conversation.\n\nUltimately, the meme can be employed in different situations where its theme of sleepiness, conflicting desires, or ironic situations aligns with the topic or sentiment being discussed, adding a touch of humor and relatability to the conversation or online interaction.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_156": {
"question": "What occasions would someone use this meme?v2_156_0.jpg",
"answer": "This meme, commonly known as \"Screaming Panda,\" is typically used to express shock, surprise, or fear. It could be used in response to a startling or unexpected event, or to convey a sense of panic or alarm. Some possible occasions where someone might use this meme include:\n\n- Reacting to a jump scare in a horror movie\n- Responding to a surprising plot twist in a TV show or book\n- Expressing shock at a news headline or current event\n- Conveying fear or anxiety about an upcoming deadline or exam\n- Showing surprise at an unexpected outcome in a sports game or other competition.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_157": {
"question": "What occasions would someone use this meme?v2_157_0.jpg",
"answer": "The \"crying cat\" meme with the Chinese caption \"Mom!\" is typically used to express a sense of distress, helplessness, or seeking comfort. Here are some occasions where someone might use this meme:\n\n Expressing vulnerability: The meme can be used to express a moment of vulnerability or when feeling overwhelmed. It can convey a sense of seeking support or empathy from others by humorously invoking the idea of calling out for one's mother.\n\n Seeking comfort or sympathy: This meme can be shared to evoke sympathy or support from friends or online communities. By using a relatable and recognizable meme format, it can effectively communicate feelings of sadness, disappointment, or needing emotional support.\n\n Self-deprecating humor: The meme can also be used in a self-deprecating manner to make light of personal situations or minor mishaps. It allows individuals to humorously highlight their own moments of perceived \"helplessness\" while inviting others to provide comfort or reassurance.\n\n Playful emotional exaggeration: The meme's dramatic and exaggerated expression can be used in a playful manner to emphasize a situation or event that is not necessarily distressing but may require attention or care. It can add a humorous touch when expressing minor inconveniences or humorous hyperbole.\n\nIt's important to note that meme usage and interpretation can vary, and individuals may find creative ways to adapt it to different contexts. The suggested occasions above provide a general understanding of when this meme could be used based on its common themes and emotional tone.",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v1"
},
"v2_158": {
"question": "How to cook this dish?v2_158_0.jpg",
"answer": "The dish is called \"Hungarian Mushroom Soup\". This Hungarian mushroom soup has lots of flavor and is fairly quick to make. It's primarily a mushroom soup but derives a lot of its flavor from other ingredients. My family loves soup and this is one of their favorites.\n\n\nPrep Time:\n15 mins\nCook Time:\n35 mins\nTotal Time:\n50 mins\nServings:\n6\n\n\n Ingredients\n\n 4 tablespoons unsalted butter\n\n 2 cups chopped onions\n\n 1 pound fresh mushrooms, sliced\n\n 2 cups chicken broth\n\n 1 tablespoon soy sauce\n\n 1 tablespoon paprika\n\n 2 teaspoons dried dill weed\n\n 1 cup milk\n\n 3 tablespoons all-purpose flour\n\n \u00bd cup sour cream\n\n \u00bc cup chopped fresh parsley\n\n 2 teaspoons lemon juice\n\n 1 teaspoon salt\n\n ground black pepper to taste\n\n\n Directions\n\nStep 1\n Melt butter in a large pot over medium heat. Add onions; cook and stir until softened, about 5 minutes. Add mushrooms and saut\u00e9 for 5 more minutes. Stir in broth, soy sauce, paprika, and dill; reduce heat to low, cover, and simmer for 15 minutes.\n\nStep 2\n Whisk milk and flour together in a separate bowl; stir into soup until blended. Cover and simmer for 15 more minutes, stirring occasionally.\n\nStep 3\n Add sour cream, parsley, lemon juice, salt, and ground black pepper; stir over low heat until warmed through, about 3 to 5 minutes. Serve immediately. ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_159": {
"question": "How to make this?v2_159_0.jpg",
"answer": "This is called \"Sparkling Cantaloupe Agua Fresca\". This refreshing agua fresca with cantaloupe and lime juice topped with club soda is perfect on a hot day.\n\nPrep Time:\n15 mins\nTotal Time:\n15 mins\nServings:\n8\n\n Ingredients\n\n 2 pounds fresh cantaloupe cubes (6 cups)\n\n 2 cups water\n\n 6 tablespoons freshly squeezed lime juice (from 2 limes)\n\n 3 tablespoons honey\n\n 1/4 teaspoon salt\n\n 2 cups club soda, chilled\n\n cantaloupe melon balls or cubes, for garnish \n\n lime zest twists, for garnish\n\n\n Directions\n\nStep 1\n Working in batches if needed, blend cantaloupe, water, lime juice, honey, and salt in a blender until smooth. Press through a sieve; discard solids. Add strained juice to a pitcher.\n\nStep 2\n Chill until ready to serve. Add club soda just before serving. Serve over ice, and garnish glasses with melon balls and lime zest twists. ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_160": {
"question": "How to cook this dish?v2_160_0.jpg",
"answer": "This dish is called \"Ginger Glazed Mahi Mahi\". This ginger sauce for mahi mahi is bursting with flavor and combines both sweet and sour taste sensations. This recipe is a snap and so delicious. You'll love it! \n\n\nPrep Time:\n5 mins\nCook Time:\n10 mins\nAdditional Time:\n20 mins\nTotal Time:\n35 mins\nServings:\n4\n\n Ingredients\n\n 3 tablespoons honey\n\n 3 tablespoons soy sauce\n\n 3 tablespoons balsamic vinegar\n\n 2 teaspoons olive oil\n\n 1 teaspoon grated fresh ginger root\n\n 1 clove garlic, crushed or to taste\n\n 4 (6 ounce) mahi mahi fillets\n\n salt and pepper to taste\n\n 1 tablespoon vegetable oil\n\n\n Directions\n\nStep 1\n Mix honey, soy sauce, balsamic vinegar, olive oil, ginger, and garlic together in a shallow dish. Season fish fillets with salt and pepper; place them skin-sides down in the dish with marinade. Cover and refrigerate for 20 minutes.\n\nStep 2\n Heat vegetable oil in a large skillet over medium-high heat. Remove fish fillets, reserving marinade. Fry fish for 4 to 6 minutes on each side, turning only once, until fish flakes easily with a fork. Remove fillets to a serving platter and keep warm.\n\nStep 3\n Pour reserved marinade into the skillet; simmer over medium heat until reduced to a glaze. Spoon glaze over fish and serve. ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_161": {
"question": "How to cook this dish?v2_161_0.jpg",
"answer": "This dish is called \"Strawberry Rhubarb Pie\". This strawberry rhubarb pie is a favorite springtime dessert in our house. The filling has a sweet-tart flavor; bake in your favorite pie crust and serve with vanilla ice cream.\n\nPrep Time:\n20 mins\nCook Time:\n35 mins\nAdditional Time:\n30 mins\nTotal Time:\n1 hr 25 mins\nServings:\n8\nYield:\n1 9-inch pie\n\n Ingredients\n\n 1 cup white sugar\n\n \u00bd cup all-purpose flour\n\n 1 pound rhubarb, cut into 1/4 inch slices\n\n 2 pints strawberries, hulled and quartered\n\n 1 recipe pastry for a 9 inch double crust pie\n\n 2 tablespoons butter\n\n 1 large egg yolk\n\n 2 tablespoons white sugar\n\n Directions\n\nStep 1\n Preheat oven to 400 degrees F (200 degrees C).\n\nStep 2\n In a large bowl, mix flour and sugar. \n\nStep 3\n Add strawberries and chopped rhubarb. Toss with sugar and flour and let stand for 30 minutes. \n\nStep 4\n Pour filling into prepared pie crust. Dot top with butter, and cover with top crust. Seal edges of top and bottom crust with water. \n\nStep 5\n Apply yolk to top of pie, using a pastry brush. \n\nStep 6\n Sprinkle with sugar. \n\nStep 7\n Cut small holes in top to let steam escape. \n\nStep 8\n Bake at 400 degrees F (200 degrees C), for 35 to 40 minutes, or until bubbly and brown. Cool on rack. \n\nStep 9\n Enjoy! ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_162": {
"question": "How to cook this dish?v2_162_0.jpg",
"answer": "This dish is called \"Authentic Chinese Egg Rolls\". These Chinese egg rolls come from my mom who is the best cook ever \u2014 and I am a picky eater. If I like this, then you will. This is very authentic because my family is Chinese and I am too. This recipe is at least 300 years old in the Ling family.\n\n\nPrep Time:\n1 hr\nCook Time:\n30 mins\nAdditional Time:\n1 hr\nTotal Time:\n2 hrs 30 mins\nServings:\n20\nYield:\n20 egg rolls\n\n\n Ingredients\n\n 4 teaspoons vegetable oil, divided\n\n 3 large eggs, beaten\n\n 1 medium head cabbage, finely shredded\n\n \u00bd carrot, julienned\n\n 1 pound Chinese barbequed or roasted pork, cut into matchsticks\n\n 1 (8 ounce) can shredded bamboo shoots\n\n 1 cup dried, shredded wood ear mushroom, rehydrated\n\n 2 green onions, thinly sliced\n\n 2 \u00bd teaspoons soy sauce\n\n 1 teaspoon salt\n\n 1 teaspoon sugar\n\n \u00bd teaspoon monosodium glutamate (MSG)\n\n 1 (14 ounce) package egg roll wrappers\n\n 1 egg white, beaten\n\n 4 cups oil for frying, or as needed\n\n Directions\n\nStep 1\n Heat 1 teaspoon vegetable oil in a wok or large skillet over medium heat. Pour in beaten eggs and cook, without stirring, until firmed up. Flip eggs over and cook for an additional 20 seconds to firm the other side. Set egg pancake aside to cool, then slice into thin strips.\n\nStep 2\n Heat remaining vegetable oil in a wok or large skillet over high heat. Stir in cabbage and carrot; cook for 2 minutes to wilt. Add pork, bamboo shoots, mushroom, green onions, soy sauce, salt, sugar, and MSG; continue cooking until vegetables soften, about 6 minutes. Stir in sliced egg, then spread the mixture out onto a pan, and refrigerate until cold, about 1 hour.\n\nStep 3\n To assemble the egg rolls: Place a wrapper onto your work surface with one corner pointing towards you. Place about 3 tablespoons of cooled filling in a heap onto the bottom third of the wrapper. Brush a little beaten egg white onto the top two edges of the wrapper, then fold the bottom corner over the filling and roll firmly to the halfway point. Fold the left and right sides snugly over the egg roll, then continue rolling until the top corners seal the egg roll with the egg white. Repeat with remaining egg roll wrappers, covering finished egg rolls with plastic wrap to keep from drying out.\n\nStep 4\n Heat about 6 inches of oil in a wok or deep-fryer to 350 degrees F (175 degrees C).\n\nStep 5\n Fry egg rolls 3 or 4 at a time until golden brown, 5 to 7 minutes. Drain on paper towels. ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_163": {
"question": "How to cook this dish?v2_163_0.jpg",
"answer": "This dish is called \"Chocolate Coated Peanut Butter Crackers\".\n\nPrep Time:\n30 mins\nCook Time:\n5 mins\nAdditional Time:\n15 mins\nTotal Time:\n50 mins\nServings:\n40\nYield:\n40 sandwich cookies\n\n\nIngredients\n\u00be cup creamy or chunky peanut butter\n\n2 pounds chocolate almond bark, broken into pieces\n\n80 buttery round crackers (such as Ritz\u00ae)\n\n2 \u00bc ounces colored candy sprinkles (Optional)\n\n\nDirections\nStep 1\nSpread approximately 1 teaspoon peanut butter onto each cracker half. Press peanut butter sides together to form 40 peanut butter-filled sandwich cookies.\n\nStep 2\nMelt almond bark in the top of a double boiler over hot, but not boiling, water. Reduce heat and keep melted chocolate in top of double boiler over simmering water.\n\nStep 3\nDip each sandwich cookie into the melted chocolate, allowing excess to drain back into pot.\n\nStep 4\nPlace coated cookies onto waxed paper and immediately sprinkle with candy sprinkles so they adhere to the melted chocolate.\n\nStep 5\nPlace cookies in the refrigerator until chocolate has set, about 15 minutes.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_164": {
"question": "How to cook this dish?v2_164_0.jpg",
"answer": "This dish is called \"Broccoli and Carrot Stir Fry\".\n\nPrep Time:\n10 mins\nCook Time:\n16 mins\nTotal Time:\n26 mins\nServings:\n5\nYield:\n5 cups\n\nIngredients\n5 \u00bd cups broccoli florets\n\n1 carrot, thinly sliced\n\n2 teaspoons water\n\n1 teaspoon cornstarch\n\n1 teaspoon chicken bouillon granules, or to taste\n\nsalt to taste\n\n2 tablespoons peanut oil\n\nDirections\nStep 1\nBring a large pot of lightly salted water to a boil. Add broccoli and cook uncovered until bright green, about 2 minutes. Transfer broccoli to a bowl of ice water using a slotted spoon and immerse for several minutes to stop the cooking process. Drain.\n\nStep 2\nBring water back to a boil in the same large pot; add sliced carrot and cook for 1 minute. Drain.\n\nStep 3\nMix water and cornstarch together in a bowl until smooth. Add chicken granules and salt and mix well.\n\nStep 4\nHeat peanut oil in a wok or large skillet over high heat; saute broccoli and carrots for 2 minutes. Add cornstarch mixture; cook and stir until vegetables are coated evenly, 1 to 2 minutes.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_165": {
"question": "How to cook this dish?v2_165_0.jpg",
"answer": "This dish is called \"Cream Cheese and Crab Sushi Rolls\".\n\nPrep Time:\n20 mins\nCook Time:\n20 mins\nTotal Time:\n40 mins\nServings:\n2\nYield:\n2 sushi rolls\n\n\nIngredients\n1 cup uncooked white rice\n\n2 cups water\n\n2 tablespoons rice vinegar\n\n1 teaspoon salt\n\n2 sheets nori seaweed sheets\n\n\u00bc cucumber, peeled and sliced lengthwise\n\n2 pieces imitation crab legs\n\n\u00bd (3 ounce) package cream cheese, sliced\n\n1 teaspoon minced fresh ginger root\n\n\nDirections\nStep 1\nGather all ingredients.\nStep 2\nBring rice and water to a boil in a saucepan over high heat. Reduce heat to medium-low, cover, and simmer until the rice is tender, and the liquid has been absorbed, 20 to 25 minutes. Stir in rice vinegar and salt. Allow to cool completely.\nStep 3\nLay out seaweed sheets. Moisten hands with water, then spread cooled rice evenly on each sheet, leaving a 1/2-inch gap along one edge, lengthwise. Arrange strips of cucumber, imitation crabmeat, and cream cheese on top of the rice in a straight line along the side opposite the gap. Roll up sushi from the toppings to the seaweed sheet's exposed end.\nStep 4\nUsing a sharp wet knife, slice each roll into 5 or 6 pieces. Serve with minced ginger on the side.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_166": {
"question": "How to cook this dish?v2_166_0.jpg",
"answer": "This dish is called \"Vegan Sweet Potato Chickpea Curry\".\n\nPrep Time:\n10 mins\nCook Time:\n20 mins\nTotal Time:\n30 mins\nServings:\n6\n\nIngredients\n3 tablespoons olive oil\n\n1 onion, chopped\n\n2 cloves garlic, minced\n\n2 teaspoons minced fresh ginger root\n\n1 (15 ounce) can chickpeas, drained\n\n1 (14.5 ounce) can diced tomatoes\n\n1 (14 ounce) can coconut milk\n\n1 sweet potato, cubed\n\n1 tablespoon garam masala\n\n1 teaspoon ground cumin\n\n1 teaspoon ground turmeric\n\n\u00bd teaspoon salt\n\n\u00bc teaspoon red chile flakes\n\n1 cup baby spinach\n\n\nDirections\nStep 1\nHeat oil in a skillet over medium heat. Cook onion, garlic, and ginger in hot oil until softened, about 5 minutes. Add chickpeas, tomatoes, coconut milk, and sweet potato. Bring to a boil, reduce heat to low, and simmer until tender, about 15 minutes.\nStep 2\nSeason with garam masala, cumin, turmeric, salt, and chile flakes. Add spinach right before serving.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_167": {
"question": "How to cook this dish?v2_167_0.jpg",
"answer": "This dish is called \"Lime Chicken Soft Tacos\".\n\nPrep Time:\n20 mins\nCook Time:\n30 mins\nTotal Time:\n50 mins\nYield:\n10 servings\n\nIngredients\n1 \u00bd pounds skinless, boneless chicken breast meat - cubed\n\n2 green onions, chopped\n\n\u215b cup red wine vinegar\n\n\u00bd lime, juiced\n\n2 cloves garlic, minced\n\n1 teaspoon dried oregano\n\n1 teaspoon white sugar\n\n\u00bd teaspoon salt\n\n\u00bd teaspoon ground black pepper\n\n10 (6 inch) flour tortillas\n\n1 tomato, diced\n\n\u00bc cup shredded lettuce\n\n\u00bc cup shredded Monterey Jack cheese\n\n\u00bc cup salsa\n\nDirections\nStep 1\nSaut\u00e9 chicken in a medium saucepan over medium high heat until tender, about 15 to 20 minutes. Add green onions, vinegar, lime juice, garlic, oregano, sugar, salt, and pepper. Simmer over low heat for 10 minutes.\nStep 2\nHeat an iron skillet over medium heat. Place a tortilla in the pan, warm, and turn over to heat the other side. Repeat with remaining tortillas. Serve lime chicken mixture in warm tortillas topped with tomato, lettuce, cheese and salsa.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_168": {
"question": "Can you give a short introduction to this movie?v2_168_0.jpg",
"answer": "The Shawshank Redemption is a 1994 American drama film written and directed by Frank Darabont, based on the 1982 Stephen King novella Rita Hayworth and Shawshank Redemption. The film tells the story of banker Andy Dufresne (Tim Robbins), who is sentenced to life in Shawshank State Penitentiary for the murders of his wife and her lover, despite his claims of innocence. Over the following two decades, he befriends a fellow prisoner, contraband smuggler Ellis \"Red\" Redding (Morgan Freeman), and becomes instrumental in a money laundering operation led by the prison warden Samuel Norton (Bob Gunton). William Sadler, Clancy Brown, Gil Bellows, and James Whitmore appear in supporting roles.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_169": {
"question": "Can you give a short introduction to this movie?v2_169_0.jpg",
"answer": "The Godfather is a 1972 American crime film directed by Francis Ford Coppola, who co-wrote the screenplay with Mario Puzo, based on Puzo's best-selling 1969 novel of the same title. The film stars Marlon Brando, Al Pacino, James Caan, Richard Castellano, Robert Duvall, Sterling Hayden, John Marley, Richard Conte, and Diane Keaton. It is the first installment in The Godfather trilogy, chronicling the Corleone family under patriarch Vito Corleone (Brando) from 1945 to 1955. It focuses on the transformation of his youngest son, Michael Corleone (Pacino), from reluctant family outsider to ruthless mafia boss.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_170": {
"question": "Can you give a short introduction to this movie?v2_170_0.jpg",
"answer": "The Dark Knight is a 2008 superhero film directed by Christopher Nolan from a screenplay he co-wrote with his brother Jonathan. Based on the DC Comics superhero, Batman, it is the sequel to Batman Begins (2005) and the second installment in The Dark Knight Trilogy. The plot follows the vigilante Batman, police lieutenant James Gordon, and district attorney Harvey Dent, who form an alliance to dismantle organized crime in Gotham City. Their efforts are derailed by the Joker, an anarchistic mastermind who seeks to test how far Batman will go to save the city from chaos. The ensemble cast includes Christian Bale, Michael Caine, Heath Ledger, Gary Oldman, Aaron Eckhart, Maggie Gyllenhaal, and Morgan Freeman.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_171": {
"question": "Can you give a short introduction to this movie?v2_171_0.jpg",
"answer": "Twelve Angry Men is an American courtroom drama written by Reginald Rose concerning the jury of a homicide trial. It was broadcast initially as a television play in 1954. The following year it was adapted for the stage. It was adapted for a film of the same name, directed by Sidney Lumet and released in 1957. Since then it has been given numerous remakes, adaptations, and tributes.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_172": {
"question": "Can you give a short introduction to this movie?v2_172_0.jpg",
"answer": "Schindler's List is a 1993 American epic historical drama film directed and produced by Steven Spielberg and written by Steven Zaillian. It is based on the 1982 novel Schindler's Ark by Australian novelist Thomas Keneally. The film follows Oskar Schindler, a German industrialist who saved more than a thousand mostly Polish\u2013Jewish refugees from the Holocaust by employing them in his factories during World War II. It stars Liam Neeson as Schindler, Ralph Fiennes as SS officer Amon G\u00f6th, and Ben Kingsley as Schindler's Jewish accountant Itzhak Stern.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_173": {
"question": "Can you give a short introduction to this movie?v2_173_0.jpg",
"answer": "The Lord of the Rings: The Return of the King is a 2003 epic fantasy adventure film directed by Peter Jackson from a screenplay by Fran Walsh, Philippa Boyens, and Jackson. It is based on 1955's The Return of the King, the third volume of the novel The Lord of the Rings by J. R. R. Tolkien. The sequel to 2002's The Lord of the Rings: The Two Towers, the film is the final instalment in The Lord of the Rings trilogy. It features an ensemble cast including Elijah Wood, Ian McKellen, Liv Tyler, Viggo Mortensen, Sean Astin, Cate Blanchett, John Rhys-Davies, Bernard Hill, Billy Boyd, Dominic Monaghan, Orlando Bloom, Hugo Weaving, Miranda Otto, David Wenham, Karl Urban, John Noble, Andy Serkis, Ian Holm, and Sean Bean. Continuing the plot of the previous film, Frodo, Sam and Gollum are making their final way toward Mount Doom to destroy the One Ring, unaware of Gollum's true intentions, while Merry, Pippin, Gandalf, Aragorn, Legolas, Gimli and the others join forces together against Sauron and his legions in Minas Tirith.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_174": {
"question": "Can you give a short introduction to this movie?v2_174_0.jpg",
"answer": "Pulp Fiction is a 1994 American crime film written and directed by Quentin Tarantino from a story he conceived with Roger Avary. It tells four intertwining tales of crime and violence in Los Angeles, California. The film stars John Travolta, Samuel L. Jackson, Bruce Willis, Tim Roth, Ving Rhames, and Uma Thurman. The title refers to the pulp magazines and hardboiled crime novels popular during the mid-20th century, known for their graphic violence and punchy dialogue.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_175": {
"question": "Can you give a short introduction to this movie?v2_175_0.jpg",
"answer": "The Lord of the Rings: The Fellowship of the Ring is a 2001 epic fantasy adventure film directed by Peter Jackson from a screenplay by Fran Walsh, Philippa Boyens, and Jackson, based on 1954's The Fellowship of the Ring, the first volume of the novel The Lord of the Rings by J. R. R. Tolkien. The film is the first installment in The Lord of the Rings trilogy. It features an ensemble cast including Elijah Wood, Ian McKellen, Liv Tyler, Viggo Mortensen, Sean Astin, Cate Blanchett, John Rhys-Davies, Billy Boyd, Dominic Monaghan, Orlando Bloom, Christopher Lee, Hugo Weaving, Sean Bean, Ian Holm, and Andy Serkis.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_176": {
"question": "Can you give a short introduction to this movie?v2_176_0.jpg",
"answer": "The Godfather Part II is a 1974 American epic crime film produced and directed by Francis Ford Coppola. The film is partially based on the 1969 novel The Godfather by Mario Puzo, who co-wrote the screenplay with Coppola, and it is both a sequel and a prequel to the 1972 film The Godfather, presenting parallel dramas: one picks up the 1958 story of Michael Corleone (Al Pacino), the new Don of the Corleone family, protecting the family business in the aftermath of an attempt on his life; the prequel covers the journey of his father, Vito Corleone (Robert De Niro), from his Sicilian childhood to the founding of his family enterprise in New York City. The ensemble cast also features Robert Duvall, Diane Keaton, Talia Shire, Morgana King, John Cazale, Mariana Hill, and Lee Strasberg.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_177": {
"question": "Can you give a short introduction to this movie?v2_177_0.jpg",
"answer": "Farewell My Concubine is a 1993 Chinese historical drama film directed by Chen Kaige, starring Leslie Cheung, Gong Li and Zhang Fengyi. Adapted for the screen by Lu Wei based on the novel by Lilian Lee, the film is set in a politically tumultuous 20th-century China, from the early days of the Republic of China to the aftermath of the Cultural Revolution. It chronicles the troubled relationships between two Peking opera actors and lifelong friends Cheng Dieyi (Cheung) and Duan Xiaolou (Zhang), and Xiaolou's wife Juxian (Gong).",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_178": {
"question": "Can you give a short introduction to this painting?v2_178_0.jpg",
"answer": "The Mona Lisa is a half-length portrait painting by Italian artist Leonardo da Vinci.\n\nConsidered an archetypal masterpiece of the Italian Renaissance, it has been described as \"the best known, the most visited, the most written about, the most sung about, the most parodied work of art in the world\". The painting's novel qualities include the subject's enigmatic expression, monumentality of the composition, the subtle modelling of forms, and the atmospheric illusionism.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_179": {
"question": "Can you give a short introduction to this painting?v2_179_0.jpg",
"answer": "Girl With A Pearl Earring (Dutch: Meisje met de parel) is an oil painting by Dutch Golden Age painter Johannes Vermeer, dated c. 1665. Going by various names over the centuries, it became known by its present title towards the end of the 20th century after the earring worn by the girl portrayed there. The work has been in the collection of the Mauritshuis in The Hague since 1902 and has been the subject of various literary and cinematic treatments.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_180": {
"question": "Can you give a short introduction to this painting?v2_180_0.jpg",
"answer": "The Starry Night is an oil-on-canvas painting by the Dutch Post-Impressionist painter Vincent van Gogh. Painted in June 1889, it depicts the view from the east-facing window of his asylum room at Saint-R\u00e9my-de-Provence, just before sunrise, with the addition of an imaginary village. It has been in the permanent collection of the Museum of Modern Art in New York City since 1941, acquired through the Lillie P. Bliss Bequest. Widely regarded as Van Gogh's magnum opus, The Starry Night is one of the most recognizable paintings in Western art.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_181": {
"question": "Can you give a short introduction to this painting?v2_181_0.jpg",
"answer": "The Kiss (in German Der Kuss) is an oil-on-canvas painting with added gold leaf, silver and platinum by the Austrian Symbolist painter Gustav Klimt. It was painted at some point in 1907 and 1908, during the height of what scholars call his \"Golden Period\". It was exhibited in 1908 under the title Liebespaar (the lovers) as stated in the catalogue of the exhibition. The painting depicts a couple embracing each other, their bodies entwined in elaborate beautiful robes decorated in a style influenced by the contemporary Art Nouveau style and the organic forms of the earlier Arts and Crafts movement.\n\nThe painting now hangs in the \u00d6sterreichische Galerie Belvedere museum in the Belvedere, Vienna, and is considered a masterpiece of Vienna Secession (local variation of Art Nouveau) and Klimt's most popular work after Portrait of Adele Bloch-Bauer I. It is considered by many as a famous work of art.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_182": {
"question": "Can you give a short introduction to this painting?v2_182_0.jpg",
"answer": "The Birth of Venus is a painting by the Italian artist Sandro Botticelli, probably executed in the mid 1480s. It depicts the goddess Venus arriving at the shore after her birth, when she had emerged from the sea fully-grown (called Venus Anadyomene and often depicted in art). The painting is in the Uffizi Gallery in Florence, Italy.\n\nAlthough the two are not a pair, the painting is inevitably discussed with Botticelli's other very large mythological painting, the Primavera, also in the Uffizi. They are among the most famous paintings in the world, and icons of the Italian Renaissance; of the two, the Birth is better known than the Primavera. As depictions of subjects from classical mythology on a very large scale they were virtually unprecedented in Western art since classical antiquity, as was the size and prominence of a nude female figure in the Birth. It used to be thought that they were both commissioned by the same member of the Medici family, but this is now uncertain.\n\nThey have been endlessly analysed by art historians, with the main themes being: the emulation of ancient painters and the context of wedding celebrations (generally agreed), the influence of Renaissance Neo-Platonism (somewhat controversial), and the identity of the commissioners (not agreed). Most art historians agree, however, that the Birth does not require complex analysis to decode its meaning, in the way that the Primavera probably does. While there are subtleties in the painting, its main meaning is a straightforward, if individual, treatment of a traditional scene from Greek mythology, and its appeal is sensory and very accessible, hence its enormous popularity.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_183": {
"question": "Can you give a short introduction to this painting?v2_183_0.jpg",
"answer": "Arrangement in Grey and Black No. 1, best known under its colloquial name Whistler's Mother or Portrait of Artist's Mother, is a painting in oils on canvas created by the American-born painter James Abbott McNeill Whistler in 1871. The subject of the painting is Whistler's mother, Anna McNeill Whistler. The painting is 56.81 by 63.94 inches (1,443 mm \u00d7 1,624 mm), displayed in a frame of Whistler's own design. It is held by the Mus\u00e9e d'Orsay in Paris, having been bought by the French state in 1891. It is one of the most famous works by an American artist outside the United States. It has been variously described as an American icon and a Victorian Mona Lisa.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_184": {
"question": "Can you give a short introduction to this painting?v2_184_0.jpg",
"answer": "The Arnolfini Portrait (or The Arnolfini Wedding, The Arnolfini Marriage, the Portrait of Giovanni Arnolfini and his Wife, or other titles) is a 1434 oil painting on oak panel by the Early Netherlandish painter Jan van Eyck. It forms a full-length double portrait, believed to depict the Italian merchant Giovanni di Nicolao Arnolfini and his wife, presumably in their residence at the Flemish city of Bruges.\n\nIt is considered one of the most original and complex paintings in Western art, because of its beauty, complex iconography, geometric orthogonal perspective, and expansion of the picture space with the use of a mirror. According to Ernst Gombrich \"in its own way it was as new and revolutionary as Donatello's or Masaccio's work in Italy. A simple corner of the real world had suddenly been fixed on to a panel as if by magic... For the first time in history the artist became the perfect eye-witness in the truest sense of the term\". The portrait has been considered by Erwin Panofsky and some other art historians as a unique form of marriage contract, recorded as a painting. Signed and dated by van Eyck in 1434, it is, with the Ghent Altarpiece by the same artist and his brother Hubert, the oldest very famous panel painting to have been executed in oils rather than in tempera. The painting was bought by the National Gallery in London in 1842.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_185": {
"question": "Can you give a short introduction to this painting?v2_185_0.jpg",
"answer": "Along the River During the Qingming Festival (Qingming Shanghe Tu) is a handscroll painting by the Song dynasty painter Zhang Zeduan (1085\u20131145) and copied many times in the following centuries. It captures the daily life of people and the landscape of the capital, Bianjing (present-day Kaifeng) during the Northern Song. The theme is often said to celebrate the festive spirit and worldly commotion at the Qingming Festival, rather than the holiday's ceremonial aspects, such as tomb sweeping and prayers. Read right to left, as a viewer unrolled it, successive scenes reveal the lifestyle of all levels of the society from rich to poor as well as economic activities in rural areas and the city, and offer glimpses of period clothing and architecture. The painting is considered to be the most renowned work among all Chinese paintings, and it has been called \"China's Mona Lisa.\"",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_186": {
"question": "Can you give a short introduction to this painting?v2_186_0.jpg",
"answer": "Dwelling in the Fuchun Mountains is one of the few surviving works by Chinese painter Huang Gongwang (1269\u20131354) and is considered to be among his greatest works. Painted between 1348 and 1350, the painting was burnt into two pieces in 1650. Today, one piece is kept in the Zhejiang Provincial Museum in Hangzhou, while the other piece is kept in the National Palace Museum in Taipei. Put together, the entire painting would measure 691.3 cm in length.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_187": {
"question": "Can you give a short introduction to this painting?v2_187_0.jpg",
"answer": "Emperor Taizong Receiving the Tibetan Envoy (also called \u6b65\u8f87\u56fe, B\u00f9ni\u01cen T\u00fa) is a painting on silk by Yan Liben to show the friendly encounter between the Tang dynasty and Tibet. The painting is 129 centimetres (51 in) long by 38.5 centimetres (15.2 in) wide. Bunian Tu is in The Palace Museum in Beijing.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_188": {
"question": "What is this disease (give short introduction) and how to treat it?v2_188_0.jpg",
"answer": "Cedar apple rust (Gymnosporangium juniperi-virginianae) is a fungal disease that requires juniper plants to complete its complicated two year life-cycle. Spores overwinter as a reddish-brown gall on young twigs of various juniper species. In early spring, during wet weather, these galls swell and bright orange masses of spores are blown by the wind where they infect susceptible apple and crab-apple trees. The spores that develop on these trees will only infect junipers the following year. From year to year, the disease must pass from junipers to apples to junipers again; it cannot spread between apple trees.\n\nOn apple and crab-apple trees, look for pale yellow pinhead sized spots on the upper surface of the leaves shortly after bloom. These gradually enlarge to bright orange-yellow spots which make the disease easy to identify. Orange spots may develop on the fruit as well. Heavily infected leaves may drop prematurely.\n\nTreatment\n1. Choose resistant cultivars when available.\n2. Rake up and dispose of fallen leaves and other debris from under trees.\n3. Remove galls from infected junipers. In some cases, juniper plants should be removed entirely.\n4. Apply preventative, disease-fighting fungicides labeled for use on apples weekly, starting with bud break, to protect trees from spores being released by the juniper host. This occurs only once per year, so additional applications after this springtime spread are not necessary.\n5. On juniper, rust can be controlled by spraying plants with a copper solution (0.5 to 2.0 oz/ gallon of water) at least four times between late August and late October.\n6. Safely treat most fungal and bacterial diseases with SERENADE Garden. This broad spectrum bio-fungicide uses a patented strain of Bacillus subtilis that is registered for organic use. Best of all, SERENADE is completely non-toxic to honey bees and beneficial insects.\n7. Containing sulfur and pyrethrins, Bonide\u00ae Orchard Spray is a safe, one-hit concentrate for insect attacks and fungal problems. For best results, apply as a protective spray (2.5 oz/ gallon) early in the season. If disease, insects or wet weather are present, mix 5 oz in one gallon of water. Thoroughly spray all parts of the plant, especially new shoots.\n8. Contact your local Agricultural Extension office for other possible solutions in your area.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_189": {
"question": "What is this disease (give short introduction) and how to treat it?v2_189_0.jpg",
"answer": "Anthracnose. It is caused by fungi in the genus Colletotrichum, a common group of plant pathogens that are responsible for diseases on many plant species. Infected plants develop dark, water soaked lesions on stems, leaves or fruit. The centers of these lesions often become covered with pink, gelatinous masses of spores especially during moist, warm weather. Anthracnose can reduce a beautiful harvest into rotted waste in just a few days.\n\nThe fungal disease overwinters in and on seeds, soil and garden debris. Cool wet weather promotes its development, and the optimum temperature for continued growth of the spores is between 75-85\u02daF. Moisture is required for development and germination of the fungus as well as for infection of the plant. It is spread by wind, rain, insects and garden tools.\n\nTreatment\n1. Choose resistant plant varieties when possible and use western grown seeds which have not been exposed to the disease.\n2. If this fungal problem is common, do NOT save your own seed from plantings.\n3. To avoid spreading the disease, keep out of gardens when plants are wet and make sure to disinfect all garden tools (one part bleach to 4 parts water) after use.\n4. Do not compost infected leaves, fruit or stems and thoroughly clean up garden areas in the fall, after harvest, to reduce over wintering sites for the fungal spores.\n5. Safely treat most fungal and bacterial diseases with SERENADE Garden. This broad spectrum bio-fungicide uses a patented strain of Bacillus subtilis that is registered for organic use. Best of all, SERENADE is completely non-toxic to honey bees and beneficial insects.\n6. Liquid copper sprays and sulfur powders should be applied weekly, starting when foliage begins to develop in the early spring and continuing throughout the growing season. Spray early in the day, and avoid applications during hot weather. Seeds may also be treated prior to planting.\n7. Neem oil spray is an organic, multi-purpose fungicide/insecticide/miticide that kills eggs, larvae and adult stages of insects as well as prevents fungal attack on plants. Apply early, at the first sign of spring budding, every 7-14 days as a preventative measure or on a 7-day schedule until existing problems are eliminated.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_190": {
"question": "What is this disease (give short introduction) and how to treat it?v2_190_0.jpg",
"answer": "It is bacterial canker, most common on cherries and plums, but may also affect apricots, peaches and many other kinds of stone fruits. Suspect this plant disease if sunken, water-soaked or \u201cgummy\u201d lesions form on the trunk or twigs. When trees begin active growth in the spring, a sour smelling sap may ooze from these wounded areas. The cankers become darker than the surrounding healthy bark, and the underlying tissue is reddish-brown to black and moist.\n\nNote: If cankers girdle the branches or trunk, the leaves above the diseased area curl and turn yellow. Growth stops and the branch or tree will eventually die.\n\nThe bacterium that causes canker, Pseudomonas syringae, enters trees through injured bark or an existing wound, such as a pruning cut on a twig or branch. Frost damage in the spring may promote additional infections. Bacterial canker infections occur during fall, winter and early spring (during cool, wet weather) and are spread by rain or water, and pruning tools. The bacteria overwinter in active cankers, in infected buds and on the surface of infected and healthy trees and weeds.\n\nTreatment\n1. Prune flowering trees during blooming when wounds heal fastest.\n2. Remove wilted or dead limbs well below infected areas.\n3. Avoid pruning in early spring and fall when bacteria are most active.\n4. Treat all pruning cuts immediately with Tanglefoot\u00ae Tree Pruning Sealer and make sure to disinfect your pruning equipment \u2014 one part bleach to 4 parts water \u2014 after each cut.\n5. If using string trimmers around the base of trees avoid damaging bark with breathable Tree Wrap to prevent infection.\n6. Brush bark with white latex paint diluted with water to reduce bark-damaging temperature fluctuations.\n7. Research has shown that copper fungicides have some success against this stone fruit problem. However, results are inconsistent. We recommend using it as one part of a total management program.\n8. Remove weeds and grass from around the base of young trees to improve air circulation and keep the trunk and crown dry.\n9. Organocide\u00ae Plant Doctor is an earth-friendly systemic fungicide that works its way through the entire plant to combat a large number of diseases on ornamentals, turf, fruit and more. Mix 1/3 to 3/4 oz per gallon of water and paint or spray over pruning wounds and surrounding areas.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_191": {
"question": "What is this disease (give short introduction) and how to treat it?v2_191_0.jpg",
"answer": "It is blossom end rot. A serious disorder of tomato, pepper, cucumber and eggplant, blossom end rot is an environmental problem (not fungal) most often caused by uneven watering or by calcium deficiency. (These can be related; uneven watering can interfere with the uptake of calcium.) This common garden \u201cdisease\u201d is often brought on by rapid growth from too much fertilizer, high salt levels or drought.\n\nBlossom end rot symptoms occur on both green and ripe fruits and is identified by water-soaked areas that gradually widen and mature into sunken, brown, leathery spots on the bottom end. In many cases, secondary pathogens, which appear as a black, fuzzy-like growth, attack the affected area and cause complete rotting of the fruit. Blossom end rot will not spread from plant to plant.\n\nTreatment\nSince this plant problem is physiological in nature, fungicides will not work as a control measure. We recommend the following:\n\n1. Choose resistant vegetable varieties whenever possible.\n2. Prevent problems by keeping soil evenly moist and by foliar spraying plants with a kelp or calcium solution.\n3. Adding high levels of calcium \u2014 bone meal, oyster shell or gypsum \u2014 to the soil at planting time usually prevents this problem from developing.\n4. A layer of mulch (straw, compost, grass ) will help conserve soil moisture during the hot, dry days of July and August.\n5. Foliar applications of Liquid Calcium 5% (1-2 Tbsp/ gallon of water) can be used to correct or prevent deficiencies of this essential nutrient. For best results, combine with a natural surfactant to increase adhesion and spray leaves to the point of run-off.\n6. Mulching plants will help conserve moisture and provide a more uniform water supply.\n7. Avoid using high nitrogen fertilizers which accelerate vegetative growth and reduce the uptake of calcium by plants. A large selection of balanced organic fertilizers are available at Planet Natural.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_192": {
"question": "What is this disease (give short introduction) and how to treat it?v2_192_0.jpg",
"answer": "It is Brown rot (Monilinia fructicola), the most common fungal disease affecting the blossoms and fruit of almonds, apricots, cherries, peaches and plums. It overwinters in mummified fruit (on the tree and on the ground) and infected twigs.\n\nThe disease first infects blossoms in spring and grows back into the small branches to cause cankers that can kill stems. Large numbers of flower-bearing stems are killed when the disease is severe. Dead flowers often remain attached into the summer. Developing or mature fruits show circular or brown spots that spread rapidly over the surface and light gray masses of spores are produced on the rotted areas. Rotted tissue remains relatively firm and dry.\n\nBrown rot spores are carried by wind, rain and insects to the open or unopened blossoms and young shoots. If water is present \u2014 either from rain, dew or watering \u2014 on the flower surface the spores can germinate and penetrate the plant. Disease development takes place over a wide temperature range and flowers can be infected from the time buds open until petals fall. Under favorable conditions, brown rot spreads quickly and an entire crop can be completely destroyed on the tree.\n\nTreatment\n1. Choose resistant varieties whenever possible.\n2. Prompt removal and destruction of infected plant parts helps break the life cycle of the disease in individual trees and small orchards, and may be sufficient to keep brown rot below damaging levels.\n3. It is important to rake up and remove any fallen fruit or debris from under trees.\n4. Prune trees occasionally to improve air circulation. Also, water from below to keep from wetting blossoms, foliage and fruit.\n5. Use Tanglefoot\u00ae Pruning Sealer to seal all cuts and wounds and protect against insects and disease organisms.\n6. Ready to use copper fungicides or sulfur powders should be applied weekly to infected trees starting when the blossoms are just beginning to open and continuing throughout the growing season. If at all possible, time applications so that 12 hours of dry weather follows application.\n7. Organocide\u00ae Plant Doctor is an earth-friendly systemic fungicide that works its way through the entire plant to combat a large number of diseases on ornamentals, turf, fruit and more. Apply as a foliar spray (1 tsp/ gallon of water) to combat this destructive stone fruit problem.\n8. Containing sulfur and pyrethrins, Bonide\u00ae Orchard Spray is a safe, one-hit concentrate for insect attacks and fungal problems. For best results, apply as a protective spray (2.5 oz/ gallon) early in the season. If disease, insects or wet weather are present, mix 5 oz in one gallon of water. Thoroughly spray all parts of the plant, especially new shoots.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_193": {
"question": "What is this disease (give short introduction) and how to treat it?v2_193_0.jpg",
"answer": "It is club root. Affecting most brassica crops (cabbage, broccoli, cauliflower, etc.), club root is a serious plant disease in North American home gardens. It is caused by the soil-borne fungus Plasmodiophora brassicae which infects susceptible plants through root hairs. Diseased roots become swollen, misshapen and deformed (clubbed) often cracking and rotting. As a result, plants have difficulty absorbing water and nutrients properly.\n\nPlants often grow poorly and wilt during the heat of the day; plants often revive during cool nights. Outer leaves may turn yellow, purple or brown. Club root will reduce yields and can cause total crop failure.\n\nFungal spores can be spread by wind, water and garden tools. Disease development can occur over a wide range of conditions, but is favored by excessive moisture, low soil pH and soil temperatures between 64 and 77\u02daF. Spores can survive in the soil for as many as 10 years.\n\nTreatment\n1. Fungicides will NOT treat this soil-dwelling micro-organism.\n2. Choose resistant cultivars when possible.\n3. Try to prevent the occurrence of this disease by keeping a clean garden and rotating crops.\n4. Keep in mind that the disease spores can persist in the soil for up to 20 years. If club root is present you may want to solarize the soil.*\n5. Control susceptible weeds \u2014 mustard, radish, shepherd\u2019s purse \u2014 that may be infected to reduce potential buildup of the disease.\n6. Carefully remove infected plants and sterilize garden tools (one part bleach to 4 parts water) after use.\n7. Raise your soil\u2019s pH to a more alkaline 7.2 by mixing oyster shell or dolomite lime into your garden in the fall. Simple and affordable soil test kits are available to check pH often.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_194": {
"question": "What is this disease (give short introduction) and how to treat it?v2_194_0.jpg",
"answer": "It is corn smut. Frequently found in backyard gardens and small farms, corn smut is caused by the fungus Ustilago zeae and can appear in the stalks, leaves, tassels or ears. Symptoms are most commonly noticed when the ears produce mushroom-like tumors or galls. These \u201cswellings\u201d begin as small, whitish-gray irregularities which expand and turn black as they fill with spores. Ear galls can grow to 4- to 5-inches in diameter and release thousands of spores as they rupture. These fungal spores are blown by the wind for considerable distances to infect new plants. Galls on leaves remain small and eventually become hard and dry.\n\nCorn smut overwinters on garden debris and in the soil. It is carried by wind, rain and irrigation and does best in hot, dry weather. Spores may remain viable for 5- to 7-years. Wounds from various injuries, including cultivation and abrasion from blowing soil, provide points for the fungus to enter the plant.\n\nTreatment\n1. Choose the best resistant varieties, such as silver king, fantasia, brilliant and seneca sensation, when available.\n2. In backyard gardens, collecting and destroying galls before the dark fungal spores are released is suggested. This will limit the number of available fungal spores and help break the disease-cycle.\n3. Reduce infection points by avoiding injury of roots, stalks and leaves during cultivation.\n4. Prevent damage from insects, such as corn borers, with Monterey\u00ae Garden Insect Spray or other organic insecticide.\n5. Fungicides are NOT an effective control option since the disease is so widespread and can persist in the soil for years.\n6. High nitrogen fertilizers may increase the severity of the disease \u2014 use a balanced organic fertilizer in the vegetable garden.\n7. Remove and destroy all garden debris after harvest and practice crop rotation the following year.\n8. Bag or burn infected plant parts \u2014 do NOT compost.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_195": {
"question": "What is this disease (give short introduction) and how to treat it?v2_195_0.jpg",
"answer": "It is crown gall, a common plant disease caused by the soil-borne bacterium Agrobacterium tumefaciens. It is found throughout the world and occurs on woody shrubs and herbaceous plants including grapes, raspberries, blackberries and roses.\n\nCrown gall symptoms include round, wart-like growths \u2014 2 inches or larger in diameter \u2014 that appear at or just above the soil line, or on lower branches and stems. Plants with several galls may be unable to move water and nutrients up the trunk and become weakened, stunted and unproductive. Young plants can be killed by developing gall tissue.\n\nThe bacteria responsible for crown gall can persist in the soil for many years and are released when galls become saturated with moisture or as older galls decompose. Susceptible plants are infected through fresh wounds or abrasions, many of which are a result of pruning, freeze injury, soil insects, cultivation and other factors that may damage plants. Nursery stock is often infected through grafting and budding scars.\n\nTreatment\n1. Select resistant cultivars when possible and purchase plants from a reputable nursery.\n2. Do not buy plants that show signs of swelling or galling.\n3. When caring for susceptible plants, avoid injury or pruning wounds that may come in contact with the soil.\n4. Use Tree Wrap to protect against string trimmer damage and keep your garden tools clean.\n5. Provide winter protection with natural burlap so bark does not crack.\n6. In many cases, existing galls can be removed with a sharp pruning knife. Destroy the infected plant tissue and treat the wound with pruning sealer. If the plant does not recover, remove and destroy it.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_196": {
"question": "What is this disease (give short introduction) and how to treat it?v2_196_0.jpg",
"answer": "It is gray mold (Botrytis cinerea). Found on a wide range of plants (too many to mention), gray mold is a fungal disease that travels quickly through gardens, especially during damp, cool to mild weather. Disease symptoms appear as grayish colored soft, mushy spots on leaves, stems, flowers and on produce. Spots may become covered with a coating of gray fungus spores, especially if humidity is high. Fruit or plants shrivel and rot and often develop black, stone-like sclerotia \u2014 a compact mass of hardened fungal filaments \u2014 under rotted parts.\n\nGray mold is often found near the soil surface or in the densest areas of the plant canopy. It develops on wilted flowers first, then spreads quickly to other parts of the plant. The disease may also occur in storage areas causing rotting of harvested fruits and vegetables.\n\nBotrytis blight overwinters on plants, in or on the soil, and as sclerotia. Spores develop when conditions are optimal, and are moved by wind or splashing water onto blossoms or young leaves, where they germinate and enter the plant. Spores require cool temperatures (45-60 F.) and high humidity (93% and above) to germinate. Germinating spores rarely penetrate green, healthy tissue directly, but can enter through wounds on growing plants. Cuttings are particularly susceptible to infection.\n\nTreatment\n1. Prune or stake plants to improve air circulation between plants. Make sure to disinfect your pruning equipment (one part bleach to 4 parts water) after each cut.\n2. If growing indoors use a small clip-on fan to improve air flow.\n3. Keep the soil under plants clean and rake up any fallen debris.\n4. Add a good amount of organic compost or mulch under plants. Mulches will prevent the fungal spores from splashing back up onto flowers and leaves.\n5. Water in the early morning hours, or use a soaker hose, to give plants time to dry out during the day.\n6. Do not compost infected plant leaves or stems, and thoroughly clean up garden areas in the fall to reduce over wintering sites for the fungal spores.\n7. Copper-Soap fungicides will help by protecting plants from disease spores. Apply at the start of flowering and continue every 7-10 days until harvest. Fungicidal sprays are especially warranted when weather forecasts predict a long period of cool, wet weather.\n8. Safely treat most fungal diseases, including Botrytis blight, with SERENADE Garden. This broad spectrum bio-fungicide uses a patented strain of Bacillus subtilis that is registered for organic use. Best of all, SERENADE is completely non-toxic to honey bees and beneficial insects.\n9. Mycostop, a biological fungicide approved for organic use, has shown suppression of the disease. Direct spray (5 gm/ 50 liters of water) to susceptible leaves, flowers and fruits to point of run-off. Apply every 2-3 weeks, or as needed depending on disease pressure.\n10. Green Cure Fungicide contains a patented formula of potassium bicarbonate \u2014 commonly used in food products \u2014 that kills many plant diseases on contact and provides up to 2 weeks of residual protection. At first sign of disease, mix 1-2 Tbsp/ gallon of water and apply to all exposed surfaces of the plant. For best protection, repeat at 1-2 week intervals until conditions are no longer favorable for disease development.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_197": {
"question": "What is this disease (give short introduction) and how to treat it?v2_197_0.jpg",
"answer": "It is early blight. Common on tomato and potato plants, early blight is caused by the fungus Alternaria solani and occurs throughout the United States. Symptoms first appear on the lower, older leaves as small brown spots with concentric rings that form a \u201cbull\u2019s eye\u201d pattern. As the disease matures, it spreads outward on the leaf surface causing it to turn yellow, wither and die. Eventually the stem, fruit and upper portion of the plant will become infected. Crops can be severely damaged.\n\nEarly blight overwinters on infected plant tissue and is spread by splashing rain, irrigation, insects and garden tools. The disease is also carried on tomato seeds and in potato tubers. In spite of its name, early blight can occur any time throughout the growing season. High temperatures (80-85\u02daF.) and wet, humid conditions promote its rapid spread. In many cases, poorly nourished or stressed plants are attacked.\n\nTreatment\nPrune or stake plants to improve air circulation and reduce fungal problems.\nMake sure to disinfect your pruning shears (one part bleach to 4 parts water) after each cut.\nKeep the soil under plants clean and free of garden debris. Add a layer of organic compost to prevent the spores from splashing back up onto vegetation.\nDrip irrigation and soaker hoses can be used to help keep the foliage dry.\nFor best control, apply copper-based fungicides early, two weeks before disease normally appears or when weather forecasts predict a long period of wet weather. Alternatively, begin treatment when disease first appears, and repeat every 7-10 days for as long as needed.\nContaining copper and pyrethrins, Bonide\u00ae Garden Dust is a safe, one-step control for many insect attacks and fungal problems. For best results, cover both the tops and undersides of leaves with a thin uniform film or dust. Depending on foliage density, 10 oz will cover 625 sq ft. Repeat applications every 7-10 days, as needed.\nSERENADE Garden is a broad spectrum, preventative bio-fungicide recommended for the control or suppression of many important plant diseases. For best results, treat prior to foliar disease development or at the first sign of infection. Repeat at 7-day intervals or as needed.\nRemove and destroy all garden debris after harvest and practice crop rotation the following year.\nBurn or bag infected plant parts. Do NOT compost.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_198": {
"question": "Can you give a short introduction to this person?v2_198_0.jpg",
"answer": "Sir Isaac Newton FRS (25 December 1642 \u2013 20 March 1726/27) was an English mathematician, physicist, astronomer, alchemist, theologian, and author who was described in his time as a natural philosopher. He was a key figure in the Scientific Revolution and the Enlightenment that followed. His pioneering book Philosophi\u00e6 Naturalis Principia Mathematica (Mathematical Principles of Natural Philosophy), first published in 1687, consolidated many previous results and established classical mechanics. Newton also made seminal contributions to optics, and shares credit with German mathematician Gottfried Wilhelm Leibniz for developing infinitesimal calculus.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_199": {
"question": "Can you give a short introduction to this person?v2_199_0.jpg",
"answer": "Confucius (/k\u0259n\u02c8fju\u02d0\u0283\u0259s/ k\u0259n-FEW-sh\u0259s; Chinese: \u5b54\u592b\u5b50; pinyin: K\u01d2ng F\u016bz\u01d0, \"Master K\u01d2ng\"; or commonly \u5b54\u5b50; K\u01d2ngz\u01d0; c.\u2009551 \u2013 c.\u2009479 BCE) was a Chinese philosopher and politician of the Spring and Autumn period who is traditionally considered the paragon of Chinese sages. Confucius's teachings and philosophy underpin East Asian culture and society, remaining influential across China and East Asia to this day.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_200": {
"question": "Can you give a short introduction to this person?v2_200_0.jpg",
"answer": "Cai Lun (Chinese: \u8521\u4f26; courtesy name: Jingzhong (\u656c\u4ef2); c.\u200950\u201362 \u2013 121 CE), formerly romanized as Ts'ai Lun, was a Chinese eunuch court official of the Eastern Han dynasty. He is traditionally regarded as the inventor of paper and the modern papermaking process. Although early forms of paper had existed since the 3rd century BCE, he occupies a pivotal place in the history of paper due to his addition of pulp via tree bark and hemp ends which resulted in the large-scale manufacture and worldwide spread of paper.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_201": {
"question": "Can you give a short introduction to this person?v2_201_0.jpg",
"answer": "Christopher Columbus (between 25 August and 31 October 1451 \u2013 20 May 1506) was an Italian explorer and navigator from the Republic of Genoa who completed four Spanish-based voyages across the Atlantic Ocean sponsored by the Catholic Monarchs, opening the way for the widespread European exploration and European colonization of the Americas. His expeditions were the first known European contact with the Caribbean and Central and South America.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_202": {
"question": "Can you give a short introduction to this person?v2_202_0.jpg",
"answer": "Albert Einstein (14 March 1879 \u2013 18 April 1955) was a German-born theoretical physicist. Best known for developing the theory of relativity, he also made important contributions to the development of the theory of quantum mechanics, and thus to modern physics. His mass\u2013energy equivalence formula E = mc\u00b2, which arises from relativity theory, has been dubbed \"the world's most famous equation\". His work is also known for its influence on the philosophy of science. He received the 1921 Nobel Prize in Physics \"for his services to theoretical physics, and especially for his discovery of the law of the photoelectric effect\", a pivotal step in the development of quantum theory. Einsteinium, one of the synthetic elements in the periodic table, was named in his honor.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_203": {
"question": "Can you give a short introduction to this person?v2_203_0.jpg",
"answer": "Louis Pasteur ForMemRS (27 December 1822 \u2013 28 September 1895) was a French chemist and microbiologist renowned for his discoveries of the principles of vaccination, microbial fermentation, and pasteurization, the last of which was named after him. His research in chemistry led to remarkable breakthroughs in the understanding of the causes and preventions of diseases, which laid down the foundations of hygiene, public health and much of modern medicine. Pasteur's works are credited with saving millions of lives through the developments of vaccines for rabies and anthrax. He is regarded as one of the founders of modern bacteriology and has been honored as the \"father of bacteriology\" and the \"father of microbiology\" (together with Robert Koch; the latter epithet also attributed to Antonie van Leeuwenhoek).",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_204": {
"question": "Can you give a short introduction to this person?v2_204_0.jpg",
"answer": "Galileo di Vincenzo Bonaiuti de' Galilei (15 February 1564 \u2013 8 January 1642) was an Italian astronomer, physicist and engineer, sometimes described as a polymath. Commonly referred to as Galileo, his name is pronounced /\u02cc\u0261\u00e6l\u026a\u02c8le\u026a.o\u028a \u02cc\u0261\u00e6l\u026a\u02c8le\u026a.i\u02cc/ (GAL-ih-LAY-oh GAL-ih-LAY-ee, Italian: [\u0261ali\u02c8l\u025b\u02d0o \u0261ali\u02c8l\u025bi]). He was born in the city of Pisa, then part of the Duchy of Florence. Galileo has been called the father of observational astronomy, modern-era classical physics, the scientific method, and modern science.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_205": {
"question": "Can you give a short introduction to this person?v2_205_0.jpg",
"answer": "Joshua Abraham Norton (February 4, 1818 \u2013 January 8, 1880), known as Emperor Norton, was a resident of San Francisco, California, who in 1859 proclaimed himself \"Norton I., Emperor of the United States\". In 1863, after Napoleon III invaded Mexico, he took the secondary title of \"Protector of Mexico\".",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_206": {
"question": "Can you give a short introduction to this person?v2_206_0.jpg",
"answer": "Lionel Andr\u00e9s Messi (Spanish pronunciation: [ljo\u02c8nel an\u02c8d\u027ees \u02c8mesi]; born 24 June 1987), also known as Leo Messi, is an Argentine professional footballer who plays as a forward for Ligue 1 club Paris Saint-Germain and captains the Argentina national team. Widely regarded as one of the greatest players of all time, Messi has won a record seven Ballon d'Or awards and a record six European Golden Shoes, and in 2020 he was named to the Ballon d'Or Dream Team. Until leaving the club in 2021, he had spent his entire professional career with Barcelona, where he won a club-record 34 trophies, including ten La Liga titles, seven Copa del Rey titles and the UEFA Champions League four times. With his country, he won the 2021 Copa Am\u00e9rica and the 2022 FIFA World Cup. A prolific goalscorer and creative playmaker, Messi holds the records for most goals in La Liga (474), most hat-tricks in La Liga (36) and the UEFA Champions League (eight), and most assists in La Liga (192) and the Copa Am\u00e9rica (17). He also has the most international goals by a South American male (102). Messi has scored over 800 senior career goals for club and country, and has the most goals by a player for a single club (672).",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_207": {
"question": "Can you give a short introduction to this person?v2_207_0.jpg",
"answer": "Alan Mathison Turing OBE FRS (/\u02c8tj\u028a\u0259r\u026a\u014b/; 23 June 1912 \u2013 7 June 1954) was an English mathematician, computer scientist, logician, cryptanalyst, philosopher, and theoretical biologist. Turing was highly influential in the development of theoretical computer science, providing a formalisation of the concepts of algorithm and computation with the Turing machine, which can be considered a model of a general-purpose computer. He is widely considered to be the father of theoretical computer science and artificial intelligence.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v1"
},
"v2_208": {
"question": "The graph below shows the long-term international migration, UK, 1999-2008.\n\nSummarize the information by selecting and reporting the main features, and make comparisons where relevant.\n\nYou should write at least 150 words.v2_208_0.png",
"answer": "The chart gives information about UK immigration, emigration and net migration between 1999 and 2008.\n\nBoth immigration and emigration rates rose over the period shown, but the figures for immigration were significantly higher. Net migration peaked in 2004 and 2007.\n\nIn 1999, over 450,000 people came to live in the UK, while the number of people who emigrated stood at just under 300,000. The figure for net migration was around 160,000, and it remained at a similar level until 2003. From 1999 to 2004, the immigration rate rose by nearly 150,000 people, but there was a much smaller rise in emigration. Net migration peaked at almost 250,000 people in 2004.\n\nAfter 2004, the rate of immigration remained high, but the number of people emigrating fluctuated. Emigration fell suddenly in 2007, before peaking at about 420,000 people in 2008. As a result, the net migration figure rose to around 240,000 in 2007, but fell back to around 160,000 in 2008.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_209": {
"question": "The graph and table below give information about water use worldwide and water consumption in two different countries.\n\nSummarise the information by selecting and reporting the main features, and make comparisons where relevant.\n\nYou should write at least 150 words.v2_209_0.png",
"answer": "The charts compare the amount of water used for agriculture, industry and homes around the world, and water use in Brazil and the Democratic Republic of Congo.\n\nIt is clear that global water needs rose significantly between 1900 and 2000, and that agriculture accounted for the largest proportion of water used. We can also see that water consumption was considerably higher in Brazil than in the Congo.\n\nIn 1900, around 500km\u00b3 of water was used by the agriculture sector worldwide. The figures for industrial and domestic water consumption stood at around one fifth of that amount. By 2000, global water use for agriculture had increased to around 3000km\u00b3, industrial water use had risen to just under half that amount, and domestic consumption had reached approximately 500km\u00b3.\n\nIn the year 2000, the populations of Brazil and the Congo were 176 million and 5.2 million respectively. Water consumption per person in Brazil, at 359m\u00b3, was much higher than that in the Congo, at only 8m\u00b3, and this could be explained by the fact that Brazil had 265 times more irrigated land.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_210": {
"question": "The charts below give information about USA marriage and divorce rates between 1970 and 2000, and the marital status of adult Americans in two of the years.\n\nSummarise the information by selecting and reporting the main features, and make comparisons where relevant.\n\nYou should write at least 150 words.v2_210_0.png",
"answer": "The first bar chart shows changes in the number of marriages and divorces in the USA, and the second chart shows figures for the marital status of American adults in 1970 and 2000.\n\nIt is clear that there was a fall in the number of marriages in the USA between 1970 and 2000. The majority of adult Americans were married in both years, but the proportion of single adults was higher in 2000.\n\nIn 1970, there were 2.5 million marriages in the USA and 1 million divorces. The marriage rate remained stable in 1980, but fell to 2 million by the year 2000. In contrast, the divorce rate peaked in 1980, at nearly 1.5 million divorces, before falling back to 1 million at the end of the period.\n\nAround 70% of American adults were married in 1970, but this figure dropped to just under 60% by 2000. At the same time, the proportion of unmarried people and divorcees rose by about 10% in total. The proportion of widowed Americans was slightly lower in 2000.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_211": {
"question": "The chart below shows the amount spent on six consumer goods in four European countries.\n\nWrite a report for a university lecturer describing the information shown below.\n\nYou should write at least 150 words.v2_211_0.png",
"answer": "The bar chart compares consumer spending on six different items in Germany, Italy, France and Britain.\n\nIt is clear that British people spent significantly more money than people in the other three countries on all six goods. Of the six items, consumers spent the most money on photographic film.\n\nPeople in Britain spent just over \u00a3170,000 on photographic film, which is the highest figure shown on the chart. By contrast, Germans were the lowest overall spenders, with roughly the same figures (just under \u00a3150,000) for each of the six products. \n\nThe figures for spending on toys were the same in both France and Italy, at nearly \u00a3160,000. However, while French people spent more than Italians on photographic film and CDs, Italians paid out more for personal stereos, tennis racquets and perfumes. The amount spent by French people on tennis racquets, around \u00a3145,000, is the lowest figure shown on the chart.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_212": {
"question": "The table below gives information about the underground railway systems in six cities.\n\nSummarise the information by selecting and reporting the main features, and make comparisons where relevant.\n\nYou should write at least 150 words.v2_212_0.png",
"answer": "The table shows data about the underground rail networks in six major cities.\n\nThe table compares the six networks in terms of their age, size and the number of people who use them each year. It is clear that the three oldest underground systems are larger and serve significantly more passengers than the newer systems.\n\nThe London underground is the oldest system, having opened in 1863. It is also the largest system, with 394 kilometres of route. The second largest system, in Paris, is only about half the size of the London underground, with 199 kilometres of route. However, it serves more people per year. While only third in terms of size, the Tokyo system is easily the most used, with 1927 million passengers per year.\n\nOf the three newer networks, the Washington DC underground is the most extensive, with 126 kilometres of route, compared to only 11 kilometres and 28 kilometres for the Kyoto and Los Angeles systems. The Los Angeles network is the newest, having opened in 2001, while the Kyoto network is the smallest and serves only 45 million passengers per year.",
"capability": [
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_213": {
"question": "The table below gives information on consumer spending on different items in five different countries in 2002.\n\nSummarise the information by selecting and reporting the main features, and make comparisons where relevant.\n\nYou should write at least 150 words.v2_213_0.jpg",
"answer": "The table shows percentages of consumer expenditure for three categories of products and services in five countries in 2002.\n\nIt is clear that the largest proportion of consumer spending in each country went on food, drinks and tobacco. On the other hand, the leisure/education category has the lowest percentages in the table.\n\nOut of the five countries, consumer spending on food, drinks and tobacco was noticeably higher in Turkey, at 32.14%, and Ireland, at nearly 29%. The proportion of spending on leisure and education was also highest in Turkey, at 4.35%, while expenditure on clothing and footwear was significantly higher in Italy, at 9%, than in any of the other countries.\n\nIt can be seen that Sweden had the lowest percentages of national consumer expenditure for food/drinks/tobacco and for clothing/footwear, at nearly 16% and just over 5% respectively. Spain had slightly higher figures for these categories, but the lowest figure for leisure/education, at only 1.98%.",
"capability": [
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_214": {
"question": "The pie charts below show units of electricity production by fuel source in Australia and France in 1980 and 2000.\n\nSummarise the information by selecting and reporting the main features, and make comparisons where relevant.\n\nYou should write at least 150 words.v2_214_0.png",
"answer": "The pie charts compare the amount of electricity produced using five different sources of fuel in two countries over two separate years.\n\nTotal electricity production increased dramatically from 1980 to 2000 in both Australia and France. While the totals for both countries were similar, there were big differences in the fuel sources used.\n\nCoal was used to produce 50 of the total 100 units of electricity in Australia in 1980, rising to 130 out of 170 units in 2000. By contrast, nuclear power became the most important fuel source in France in 2000, producing almost 75% of the country\u2019s electricity.\n\nAustralia depended on hydro power for just under 25% of its electricity in both years, but the amount of electricity produced using this type of power fell from 5 to only 2 units in France. Oil, on the other hand, remained a relatively important fuel source in France, but its use declined in Australia. Both countries relied on natural gas for electricity production significantly more in 1980 than in 2000.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_215": {
"question": "Chorleywood is a village near London whose population has increased steadily since the middle of the nineteenth century. The map below shows the development of the village.\n\nWrite a report for a university lecturer describing the development of the village. \n\nYou should write at least 150 words.v2_215_0.jpg",
"answer": "The map shows the growth of a village called Chorleywood between 1868 and 1994.\n\nIt is clear that the village grew as the transport infrastructure was improved. Four periods of development are shown on the map, and each of the populated areas is near to the main roads, the railway or the motorway.\n\nFrom 1868 to 1883, Chorleywood covered a small area next to one of the main roads. Chorleywood Park and Golf Course is now located next to this original village area. The village grew along the main road to the south between 1883 and 1922, and in 1909 a railway line was built crossing this area from west to east. Chorleywood station is in this part of the village.\n\nThe expansion of Chorleywood continued to the east and west alongside the railway line until 1970. At that time, a motorway was built to the east of the village, and from 1970 to 1994, further development of the village took place around motorway intersections with the railway and one of the main roads.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_216": {
"question": "The map below is of the town of Garlsdon. A new supermarket (S) is planned for the town. The map shows two possible sites for the supermarket.\n\nSummarise the information by selecting and reporting the main features, and make comparisons where relevant. \n\nYou should write at least 150 words.v2_216_0.png",
"answer": "The map shows two potential locations (S1 and S2) for a new supermarket in a town called Garlsdon.\n\nThe main difference between the two sites is that S1 is outside the town, whereas S2 is in the town centre. The sites can also be compared in terms of access by road or rail, and their positions relative to three smaller towns.\n\nLooking at the information in more detail, S1 is in the countryside to the north west of Garlsdon, but it is close to the residential area of the town. S2 is also close to the housing area, which surrounds the town centre.\n\nThere are main roads from Hindon, Bransdon and Cransdon to Garlsdon town centre, but this is a no traffic zone, so there would be no access to S2 by car. By contrast, S1 lies on the main road to Hindon, but it would be more difficult to reach from Bransdon and Cransdon. Both supermarket sites are close to the railway that runs through Garlsdon from Hindon to Cransdon.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_217": {
"question": "The diagram below shows how the Australian Bureau of Meteorology collects up-to-the-minute information on the weather in order to produce reliable forecasts.\n\nWrite a report for a university lecturer describing the information shown below. \n\nYou should write at least 150 words.v2_217_0.png",
"answer": "The figure illustrates the process used by the Australian Bureau of Meteorology to forecast the weather.\n\nThere are four stages in the process, beginning with the collection of information about the weather. This information is then analysed, prepared for presentation, and finally broadcast to the public.\n\nLooking at the first and second stages of the process, there are three ways of collecting weather data and three ways of analysing it. Firstly, incoming information can be received by satellite and presented for analysis as a satellite photo. The same data can also be passed to a radar station and presented on a radar screen or synoptic chart. Secondly, incoming information may be collected directly by radar and analysed on a radar screen or synoptic chart. Finally, drifting buoys also receive data which can be shown on a synoptic chart.\n\nAt the third stage of the process, the weather broadcast is prepared on computers. Finally, it is delivered to the public on television, on the radio, or as a recorded telephone announcement.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v1"
},
"v2_218": {
"question": "How much did I pay for tax?\nWhere is the information?v2_218_0.pngv2_218_1.pngv2_218_2.png",
"answer": "In the first receipt, you paid $3.72 for tax. The information is located at the bottom of the receipt. In the second receipt, you paid $42.23 for tax. The information is located near the bottom of the receipt, under the line of \"Sales Tax\". In the third receipt, you paid $4.58 for tax. The information is located at the bottom of the receipt, under the line of \"TAX\". Overall, you paid $50.53 in tax across all three receipts.",
"capability": [
"ocr",
"spat",
"math",
"seq",
"gen"
],
"added_in": "v2"
},
"v2_219": {
"question": "How much should I pay for the beer on the table according to the price on the menu?v2_219_0.pngHere is a photo of the menu.v2_219_1.png",
"answer": "12",
"capability": [
"rec",
"ocr",
"spat",
"math",
"seq"
],
"added_in": "v2"
},
"v2_220": {
"question": "Describe the image with a sentence consisting of three words.v2_219_0.png",
"answer": "Seaside dining table",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_221": {
"question": "Describe the image with a sentence consisting of six words.v2_219_0.png",
"answer": "Dining table overlooking ocean with beer",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_222": {
"question": "Describe the image with a sentence consisting of nine words.v2_219_0.png",
"answer": "Outdoor restaurant table with ocean view and a beer",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_223": {
"question": "Write a sentence for the image consisting only of words starting with the letter 'B'.v2_219_0.png",
"answer": "Beachside bar boasts beautiful blue backdrop.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_224": {
"question": "Write a sentence for the image consisting only of words starting with the letter 'D'.v2_219_0.png",
"answer": "Dining deck displays delightful drinks, distant docks.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_225": {
"question": "Write a sentence for the image consisting only of words starting with the letter 'T'.v2_219_0.png",
"answer": "Tabletop terrace teeming with tropical tranquility.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_226": {
"question": "What would the missing image look like?v2_226_0.png",
"answer": "star with a dot",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_227": {
"question": "Here are three sub images arranged in a 2-by-2 matrix. First, look at the two images in the first column, in the top left and bottom left. Then, find out the pattern in the first column based on the left two images. Next, use the found pattern and the image in the top right to infer the missing figure. Finally, describe what would the missing image look like?v2_226_0.png",
"answer": "star with a dot",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_228": {
"question": "Please read the text in this image and return the information in the following JSON format (note xxx is placeholder, if the information is not available in the image, put \"N/A\" instead).\n{\"class\": xxx, \"DLN\": xxx, \"DOB\": xxx, \"Name\": xxx, \"Address\": xxx, \"EXP\": xxx, \"ISS\": xxx, \"SEX\": xxx, \"HGT\": xxx, \"WGT\": xxx, \"EYES\": xxx, \"HAIR\": xxx, \"DONOR\": xxx}v2_228_0.png",
"answer": "{\"class\": \"D\", \"DLN\": \"D08954796\", \"DOB\": \"01/01/1974\", \"Name\": \"Jelani Sample\", \"Address\": \"123 Main St, Phoenix, AZ 85007\", \"EXP\": \"03/01/2024\", \"ISS\": \"03/01/2016\", \"SEX\": \"M\", \"HGT\": \"5-09\", \"WGT\": \"185 lbs\", \"EYES\": \"BRO\", \"HAIR\": \"BRO\", \"DONOR\": \"Y\"} ",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_229": {
"question": "Please read the text in this image and return the information in the following JSON format (note xxx is placeholder, if the information is not available in the image, put \"N/A\" instead).\n{\"class\": xxx, \"DLN\": xxx, \"DOB\": xxx, \"Name\": xxx, \"Address\": xxx, \"EXP\": xxx, \"ISS\": xxx, \"SEX\": xxx, \"HGT\": xxx, \"WGT\": xxx, \"EYES\": xxx, \"HAIR\": xxx, \"DONOR\": xxx}v2_229_0.png",
"answer": "{\"class\": \"C\", \"DLN\": \"I234568\", \"DOB\": \"08/31/1977\", \"Name\": \"Ima Cardholder\", \"Address\": \"2570 24th Street, Anytown, CA 95818\", \"EXP\": \"08/31/2014\", \"ISS\": \"08/31/2009\", \"SEX\": \"F\", \"HGT\": \"5-05\", \"WGT\": \"125 lbs\", \"EYES\": \"BRN\", \"HAIR\": \"BRN\", \"DONOR\": \"Y\"}",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_230": {
"question": "Please read the text in this image and return the information in the following JSON format (note xxx is placeholder, if the information is not available in the image, put \"N/A\" instead).\n{\"Surname\": xxx, \"Given Name\": xxx, \"USCIS #\": xxx, \"Category\": xxx, \"Country of Birth\": xxx, \"Date of Birth\": xxx, \"SEX\": xxx, \"Card Expires\": xxx, \"Resident Since\": xxx}v2_230_0.png",
"answer": "{\"Surname\": \"STEVENS\", \"Given Name\": \"ICHIKA\", \"USCIS #\": \"000-000-000\", \"Category\": \"IR1\", \"Country of Birth\": \"Japan\", \"Date of Birth\": \"18 AUG 1988\", \"SEX\": \"F\", \"Card Expires\": \"07/04/2027\", \"Resident Since\": \"07/05/2017\"} ",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_231": {
"question": "Count the number of apples in the image.v2_231_0.png",
"answer": "11",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_232": {
"question": "Describe the pointed region in the image.v2_232_0.png",
"answer": "hanging light",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_233": {
"question": "Describe the pointed region in the image.v2_233_0.png",
"answer": "The highlighted red region in the image is a table cell that contains a numeric value of 122.3 and is located in the \"test set\" section of the table, under the column \"out\" and the row \"GIT2\". This value represents the overall performance of the GIT2 method on the test set in the category \"out\".",
"capability": [
"ocr",
"spat",
"math",
"gen"
],
"added_in": "v2"
},
"v2_234": {
"question": "What is in the circled glass? Object 1 or 2?\nDescribe what is Object 1 and object 2. Then check what is in the circled glass.v2_234_0.png",
"answer": "Object 1 is a glass bottle of water. It is clear and has a blue label on it. Object 2 is a glass bottle of Magna beer. It is green and has a red and white label. In the circled glass it appears to be a clear liquid, likely water, so it is likely that the contents of the circled glass are from Object 1, the glass bottle of water.",
"capability": [
"rec",
"spat",
"gen"
],
"added_in": "v2"
},
"v2_235": {
"question": "Answer the question in the following figure. Provide intermediate steps.v2_235_0.png",
"answer": "To find the length of the blue arrowed edge, we can use the Pythagorean theorem since we have a right triangle. According to the theorem stating that a\u00b2 + b\u00b2 = c\u00b2, where a and b are the two legs of the right triangle and c is the hypotenuse, we can plug in the values we have, and get:\n4\u00b2 + 8\u00b2 = c\u00b2 16 + 64 = c\u00b2 80 = c\u00b2 \u221a80 = c 8.94 \u2248 c Therefore, the length of the blue arrowed edge is approximately 8.94.\nTo find the angle at the green arrow, we can use the tangent function since we have the opposite and adjacent sides of the angle. The tangent function states that tan\u03b8 = opposite/adjacent. Plugging in the values we have, we get: tan\u03b8 = 4/8 tan\u03b8 = 1/2 \u03b8 = tan^-1(1/2) \u03b8 \u2248 26.57\u00b0 Therefore, the angle at the green arrow is approximately 26.57\u00b0.",
"capability": [
"rec",
"ocr",
"spat",
"math"
],
"added_in": "v2"
},
"v2_236": {
"question": "Find out the pattern in the first column, and use it to infer the missing figure in the second column.v2_236_0.pngFor example, the circled region in the first left column shows the pattern of adding a line through it. Therefore, the answer is a figure of a diamondv2_236_1.pngwith a line through it, looking likev2_236_2.png. Answer the question in the following figure.v2_226_0.pngv2_236_4.png",
"answer": "Option cImage c",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_237": {
"question": "Find out the pattern in the first column, and use it to infer the missing figure in the second column. v2_237_0.pngFor example,v2_237_1.pngTherefore, adds a line to image 2v2_236_1.pngwill be a diamond with a line through it. 1.v2_237_3.png2.v2_237_4.png3.v2_237_5.png4. Here are three sub images arranged in a 2-by-2 matrix. What is the pattern between image 3 and image 1? What would be the next image to complete the matrix? a.v2_237_6.pngb.v2_237_7.pngc.v2_237_8.pngd.v2_237_9.pnge.v2_237_10.pngf.v2_237_11.png",
"answer": "Option cImage c",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_238": {
"question": "What is the read of the speed meter?v2_238_0.png",
"answer": "10",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v2"
},
"v2_239": {
"question": "What is the read of the speed meter? To read this speed meter, observe the needle on the outer edge of the dial which points to your current speed represented in miles per hour. Yellow is the color of the needle.v2_238_0.png",
"answer": "10",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v2"
},
"v2_240": {
"question": "What is the read of the speed meter?v2_240_0.pngThe yellow pointer is roughly at the middle between 80 and 100 mph. The middle between 80 and 100 is 90. The speed is around 91 mph, as the pointer is just passing 90 mph.v2_238_0.png",
"answer": "10",
"capability": [
"rec",
"ocr",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_241": {
"question": "What is the read of the speed meter?v2_241_0.pngThe yellow pointer is at the long tick between 20 and 40 mph. The long tick at the middle between 20 and 40 is 30. The speed is around 29 mph, as the pointer is close to 30 mph but not quite 30 yet.v2_238_0.png",
"answer": "10",
"capability": [
"rec",
"ocr",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_242": {
"question": "What is the read of the speed meter?v2_240_0.pngThe yellow pointer is roughly at the middle between 80 and 100 mph. The middle between 80 and 100 is 90. The speed is around 91 mph, as the pointer is just passing 90 mph.v2_241_0.pngThe yellow pointer is at the long tick between 20 and 40 mph. The long tick at the middle between 20 and 40 is 30. The speed is around 29 mph, as the pointer is close to 30 mph but not quite 30 yet.v2_238_0.png",
"answer": "10",
"capability": [
"rec",
"ocr",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_243": {
"question": "In the graph, which year has the highest average gas price for the month of June?v2_243_0.png",
"answer": "2022",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v2"
},
"v2_244": {
"question": "Describe the imagev2_244_0.png",
"answer": "The image shows a collage of 8 prominent personalities from various fields. On the top row, from left to right, there is singer Justin Bieber, footballer Lionel Messi, footballer Cristiano Ronaldo, and entrepreneur Elon Musk. On the bottom row, from left to right, there is model and reality TV star Kylie Jenner, singer Taylor Swift, actor Robert Downey Jr., and actor Scarlett Johansson. All individuals are shown in different poses and outfits, with various backgrounds.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_245": {
"question": "Who is the person in the image and what is the person doing?v2_245_0.png",
"answer": "Joe Biden",
"capability": [
"rec",
"know"
],
"added_in": "v2"
},
"v2_246": {
"question": "Who is the person in the image and what is the person doing?v2_246_0.jpg",
"answer": "Jensen Huang",
"capability": [
"rec",
"know"
],
"added_in": "v2"
},
"v2_247": {
"question": "Describe the landmark in the image.v2_247_0.jpg",
"answer": "The landmark in this image is the Space Needle, an observation tower in Seattle, Washington, that is 605 feet tall and offers panoramic views of the city and surrounding areas. The tower was built for the 1962 World's Fair and has since become a symbol of Seattle and a popular tourist attraction. The tower has a futuristic design with a large circular observation deck at the top and a restaurant that rotates 360 degrees. The base of the tower is surrounded by a park with trees and green spaces.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_248": {
"question": "Describe the landmark in the image.v2_248_0.jpg",
"answer": "This image shows the Kinkaku-ji temple in Kyoto, Japan, also known as the Golden Pavilion, a three-story Buddhist temple covered in gold leaf that sits on a pond, creating a stunning reflection on the water. The surrounding landscape is filled with trees and rocks, creating a serene and peaceful atmosphere. It is a popular tourist attraction and a designated National Special Historic Site.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_249": {
"question": "Describe the landmark in the image.v2_249_0.jpg",
"answer": "The landmark in the image is the statue of George M. Cohan in Times Square, New York City. It is a bronze statue that stands on a granite pedestal in Duffy Square which is the northern part of Times Square and is a tribute to George M. Cohan, an American entertainer, playwright, composer and producer. The statue was unveiled in 1959 and has since become a popular tourist attraction in Times Square.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_250": {
"question": "Describe the landmark in the image.v2_250_0.jpg",
"answer": "The landmark in the image is the famous Lombard Street in San Francisco, California, known for its steep hairpin turns. The street is lined with colorful flowers and shrubbery, and there are houses and buildings on both sides. In the background you can see the city skyline and the Coit Tower on Telegraph Hill. It is often considered one of the most crooked streets in the world.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_251": {
"question": "Describe the landmark in the image.v2_251_0.jpg",
"answer": "The landmark in the image is the Taipei 101 building in Taipei, Taiwan. The building has a height of 508 meters (1,667 feet), with 101 floors above ground and 5 floors below ground, and is a popular tourist attraction in Taipei. The design of the building resembles a bamboo plant, symbolizing strength and resilience.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_252": {
"question": "Describe the landmark in the image.v2_252_0.jpg",
"answer": "The landmark in the image is the Manhattan Bridge, seen from the DUMBO neighborhood in Brooklyn, New York. The bridge spans the East River and connects Lower Manhattan with Brooklyn. It is a suspension bridge with two large towers and was completed in 1909. In the image, the bridge is framed by two brick buildings, creating a unique view of the landmark.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_253": {
"question": "Describe the landmark in the image.v2_253_0.jpg",
"answer": "The landmark in the image is the interior of Trump Tower in New York City. The focal point is the Trump Grill, a restaurant on the lower level of the tower, with red and gold accents, marble walls and columns and a festive holiday display featuring a Christmas tree and poinsettias. The space is opulent and luxurious, typical of the Trump brand.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_254": {
"question": "Describe the landmark in the image.v2_254_0.jpg",
"answer": "The landmark in the image is the Fushimi Inari Taisha Shrine in Kyoto, Japan, known for its thousands of vermilion gate gates that line the paths leading up to the shrine, and are donated by individuals and businesses to show their devotion to the inari deity. The gates represent the boundary between the secular world and the sacred world. The image shows a path lined with these gates leading up to the shrine, with stone steps in the center.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_255": {
"question": "Describe the name of the dish.v2_255_0.png",
"answer": "The dish on the photo is a bowl of Mapo Tofu, a popular Chinese dish from the Sichuan Province consists of soft tofu cubes in a rich and spicy sauce of chili peppers, fermented bean paste and Sichuan peppercorns garnished with thin slices of green onions.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_256": {
"question": "Describe the name of the dish.v2_256_0.jpg",
"answer": "Unagi Donburi is the name of the dish that originates from Japan and is typically a type of rice bowl dish eaten in a deep bowl. The word means freshwater eel in Japanese and refers to a large bowl with rice and other toppings. Unagi Donburi is a dish made with grilled eel and a type of sweet and savory sauce called \u201cunagi sauce\u201d served over white rice.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_257": {
"question": "Describe the name of the dish.v2_257_0.jpg",
"answer": "This dish is called a Cajun Sampler, which consists of four small bowls of traditional Cajun dishes -- gumbo, jambalaya, red beans and rice and crawfish \u00e9touff\u00e9e. The bowls are served with a side of sliced bread for dipping. Each bowl is filled with white rice and topped with green onions. It is a popular dish in Louisiana and a great way to try a variety of Cajun flavors.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_258": {
"question": "Describe the name of the dish.v2_258_0.jpg",
"answer": "This dish is called Braised Short Rib with Chimichurri and features a succulent short rib that has been slow cooked until tender and topped with a flavorful chimichurri sauce. It is served with roasted vegetables for a complete meal.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_259": {
"question": "Describe the imagev2_259_0.png",
"answer": "The image is a black and white X-ray of a human skull viewed from the front with the top and bottom of the skull clearly visible; the teeth and jaw bones are also visible but not as clear; the nasal cavity and eye sockets are also visible with an \u201cL\u201d on the bottom right corner, indicating that it is the left side of the skull.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_260": {
"question": "Are there wisdom teeth that needs to be removed in this x-ray image?v2_259_0.png",
"answer": "Yes",
"capability": [
"rec",
"know",
"spat"
],
"added_in": "v2"
},
"v2_261": {
"question": "Which wisdom tooth is hardest to remove?v2_259_0.png",
"answer": "lower and impacted wisdom teeth",
"capability": [
"rec",
"know",
"spat"
],
"added_in": "v2"
},
"v2_262": {
"question": "What\u2019s wrong?v2_262_0.png",
"answer": "There appears to be a fracture or break in the fifth metatarsal bone (the bone on the outside of the foot that connects with the pinky toe) ; this is commonly known as the \"Jonges Fracture \".",
"capability": [
"rec",
"know",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_263": {
"question": "Look at the CT scan of lung in the image below, tell me what's wrong.v2_263_0.png",
"answer": "There appears to be multiple areas of consolidation and ground-glass opacities in both lungs, which could indicate lung infection or inflammation and there is a possible mass or nodule in the right upper lobe. Further evaluation and clinical correlation is needed to determine the exact diagnosis.",
"capability": [
"rec",
"know",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_264": {
"question": "Describe the imagev2_264_0.png",
"answer": "The image is composed of three different icons arranged horizontally with a thin vertical line separating each icon : On the left is an icon that looks like the letter O with a blue horizontal line running through the middle ; on the right is an icon composed of two overlapping triangles with points that point upwards ; on the right is an icon of a shield-like shape with three arrows pointing upwards ; this is the logo of the automobile brand Maserati.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_265": {
"question": "Describe the logos in detailsv2_264_0.png",
"answer": "The Leftmost is BMW\u2019s logo. It is a circle icon filled with black color. Inside the circle, there is a blue horizontal line running through the middle. The area above the blue line is white and the area below the blue line is light blue. This logo represents a spinning propeller of an airplane, which is a nod to the company\u2019s history in aviation.\nThe middle one is the Infiniti logo. It is composed of two overlapping triangles, with the points facing upward. The triangles are filled in with black color. The logo represents a mountain or a road, which is a nod to the company\u2019s ethos of power, strength, and performance.\nThe rightmost one is the Maserati logo, which is composed of a shield-like shape and has three red arrows pointing upward. The shield shape is filled in with a faint white color, and the area between the arrows is black. This logo is a nod to the company\u2019s history in racing, with the arrows representing the company\u2019s victories.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_266": {
"question": "Describe both the image and logo in detailsv2_266_0.jpg",
"answer": "The image is of a McDonald\u2019s french fry container, filled with golden brown french fries. The red container has the iconic McDonald\u2019s \u201cM\u201d logo on it. The bright yellow background makes the red container and fries stand out.\nThe logo is the McDonald\u2019s \u201cM\u201d which is a large golden arch, forming the letter \u201cM\u201d for McDonald\u2019s. It is one of the most recognized logos in the world and is often associated with the fast food chain.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_267": {
"question": "Describe both the image and logo in detailsv2_267_0.jpg",
"answer": "The image shows two Starbucks cups. One is a clear plastic cup with a lid and straw, and the other is a white paper cup with a lid. The clear plastic cup contains a cold drink with ice and whipped cream on top, while the white paper cup contains a hot drink. The cups are placed on a wooden table with a blurred background of a Starbucks store.\nThe logo on the cups is the Starbucks logo, a green circle with a white mermaid or siren in the center.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_268": {
"question": "Describe both the image and logo in detailsv2_268_0.jpg",
"answer": "The image shows a woman in traditional Japanese clothing standing in front of the Olympic rings logo, wearing a purple kimono with a floral pattern and a red Obi belt, smiling and posing for the photo. The symbol is composed of five interlocking rings of different colors: blue, yellow, black, green, and red. The rings are arranged in such a way that they form a flower-like shape. The logo is displayed on a grassy area with trees in the background. ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_269": {
"question": "Describe both the image and logo in detailsv2_269_0.jpg",
"answer": "The image shows two wet Coca-Cola bottles lying on a bed of ice cubes, indicating they are chilled and ready to drink. The bottle on the left is a new grip bottle, as mentioned on the label. The bottle on the right is a regular Coca-Cola bottle. Both bottles have the iconic Coca-Cola logo on them.\nThe logo is written in a cursive font in white color, with a red background. The first \"C\" in Coca is larger than the rest of the letters, and the \"o\" in Cola is elongated. The logo is instantly recognizable and is synonymous with the brand. ",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v2"
},
"v2_270": {
"question": "Describe both the image and logo in detailsv2_270_0.jpg",
"answer": "The image shows a close-up of a person\u2019s foot wearing a white Nike Air Force 1 sneaker. The shoe is a low-top style with a white rubber sole and white laces. The upper of the shoe is made of textured white leather to give it a premium look.\nThe logo shown on the sneaker is the iconic Nike Swoosh. It is displayed on the side of the shoe in a silver color. The Swoosh is a curved, elongated checkmark shape with a pointed tip at the end. It represents speed and motion, embodying the brand\u2019s athletic and sporty aesthetic.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_271": {
"question": "Describe both the image and logo in detailsv2_271_0.jpg",
"answer": "The image is a screenshot from a presentation about Microsoft 365 Copilot. The image shows a man standing in front of a large screen with the Microsoft 365 Copilot logo and some text on it. The man is wearing a blue sweater and is gesturing with his hands as he speaks. The background is a modern-looking set with a green plant and a gray wall.\nThe logo for Microsoft 365 Copilot is a square with rounded corners. The background of the logo is white, and the text \"Microsoft 365 Copilot\" is written in black. The center of the logo is a colorful shape resembling a cube with three sides visible. The colors of the shape are blue, purple, and pink, and the shape is slightly tilted to the right. The logo is simple and modern, with a clean and professional look. ",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v2"
},
"v2_272": {
"question": "Describe the imagev2_272_0.png",
"answer": "The image is a screenshot of a dashcam taken from inside a car showing the view of the road ahead: The car is driving on a two-lane road with a speed limit sign of 35 mph visible on the right side of the road, trees on both sides of the road and the sky is filled with dark clouds, suggesting that it could soon rain; orange cones are visible on the left side of the road indicating a construction zone; and in the distance there is a bridge overpass.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_273": {
"question": "Describe the imagev2_273_0.png",
"answer": "The image is a view of a road from the perspective of a car dashboard camera. The road has two lanes, and the car is in the right lane behind a silver vehicle. Two yellow signs on the side of the road warn drivers of an upcoming pedestrian crossing and a curve to the left. The sky is cloudy and gray, and trees and bushes line the sides of the road. ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_274": {
"question": "Can you find the red ball near the gray cat in the image?v2_274_0.png",
"answer": "No",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_275": {
"question": "Can you see the bright blue feathers on the bird's wing?v2_275_0.png",
"answer": "No",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_276": {
"question": "Can you spot the pink elephant playing in the corner?v2_276_0.png",
"answer": "No",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_277": {
"question": "Can you find the baseball player wearing a blue shirt?v2_277_0.png",
"answer": "No",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_278": {
"question": "Try to locate a large waterfall behind the trees.v2_278_0.png",
"answer": "No",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_279": {
"question": "Can you find the blue lighting fixture mounted to the ceiling?v2_279_0.png",
"answer": "No",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_280": {
"question": "Count the number of apples in the image.v2_280_0.jpg",
"answer": "7",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_281": {
"question": "Count the number of apples in the image.v2_281_0.jpg",
"answer": "16",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_282": {
"question": "Count the number of oranges in the image.v2_282_0.jpg",
"answer": "3",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_283": {
"question": "Count the number of people in the image.v2_283_0.jpg",
"answer": "3",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_284": {
"question": "Count the number of people in the image.v2_284_0.jpg",
"answer": "4",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_285": {
"question": "Count the number of people in the image.v2_285_0.jpg",
"answer": "10",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_286": {
"question": "Localize each person in the image using bounding box. The image size is (width, height) = (512,403)v2_286_0.png",
"answer": "There is only one person in the image with the bounding box:\n- Top left: (151, 38)\n- Bottom right: (309, 403)",
"capability": [
"rec",
"spat",
"gen"
],
"added_in": "v2"
},
"v2_287": {
"question": "Localize each car in the image using bounding box. What is the image size of the input image?v2_287_0.jpg",
"answer": "The image size of the input image is 144 x 144 pixels.\nBounding box for the black car:\n- Top left corner: (11, 75)\n- Bottom right corner: (49, 101)\nBounding box for the white car:\n- Top left corner: (77, 73)\n- Bottom right corner: (141, 105)",
"capability": [
"rec",
"spat",
"gen"
],
"added_in": "v2"
},
"v2_288": {
"question": "Localize each person in the image using bounding box. What is the image size of the input image?v2_288_0.jpg",
"answer": "The image size of the input image is 512 x 195 pixels.\nBounding boxes for each person:\n- Person 1 (leftmost): (x1, y1) = (99, 48), (x2, y2) = (163, 160)\n- Person 2: (x1, y1) = (158, 47), (x2, y2) = (217, 153)\n- Person 3: (x1, y1) = (289, 40), (x2, y2) = (336, 162)\n- Person 4: (x1, y1) = (319, 47), (x2, y2) = (387, 169)\n- Person 5 (rightmost): (x1, y1) = (467, 46), (x2, y2) = (512, 152)",
"capability": [
"rec",
"spat",
"gen"
],
"added_in": "v2"
},
"v2_289": {
"question": "Please follow the instructions\n1. Tell me the size of the input image;\n2. Localize each person in the image using bounding box;\n3. Recognize each person;\n4. Generate detailed caption for each bounding box.v2_284_0.jpg",
"answer": "1. The size of the input image is 512 x 384 pixels.\n2. Bounding box 1: (x1, y1) = (120, 250), (x2, y2) = (420, 950) - Person 1\nBounding box 2: (x1, y1) = (500, 240), (x2, y2) = (800, 940) - Person 2\nBounding box 3: (x1, y1) = (880, 230), (x2, y2) = (1180, 930) - Person 3\nBounding box 4: (x1, y1) = (1260, 220), (x2, y2) = (1560, 920) - Person 4\n3. Person 1: Yann LeCun\nPerson 2: Geoffrey Hinton\nPerson 3: Yoshua Bengio\nPerson 4: Andrew Ng\n4. Caption for bounding box 1: Yann LeCun, computer scientist and one of the founding fathers of artificial intelligence.\nCaption for bounding box 2: Geoffrey Hinton, computer scientist and cognitive psychologist, known for his work on artificial neural networks.\nCaption for bounding box 3: Yoshua Bengio, computer scientist and co-founder of the Montreal Institute for Learning Algorithms.\nCaption for bounding box 4: Andrew Ng, computer scientist and entrepreneur, known for his work on deep learning and artificial intelligence. ",
"capability": [
"rec",
"know",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_290": {
"question": "Compare the average kinetic energies of the particles in each sample. The diagrams below show two pure samples of gas in identical closed, rigid containers. Each colored ball represents one gas particle. Both samples have the same number of particles. Which sample has the higher temperature? Sample A or sample B?v2_290_0.png",
"answer": "A",
"capability": [
"rec",
"know",
"spat"
],
"added_in": "v2"
},
"v2_291": {
"question": "Which of these states is farthest north?v2_291_0.png",
"answer": "Delaware",
"capability": [
"rec",
"spat",
"ocr",
"know"
],
"added_in": "v2"
},
"v2_292": {
"question": "Which of the organisms is the producer in this food web?v2_292_0.png",
"answer": "berries and flowers, grasses, and seeds",
"capability": [
"ocr",
"spat",
"know"
],
"added_in": "v2"
},
"v2_293": {
"question": "Suppose you are a teacher, please use the figure to explain the distinction between evaporation and evapotranspiration.v2_293_0.jpg",
"answer": "Okay, class, today we will learn about the distinction between evaporation and evapotranspiration. Let\u2019s take a look at this figure.\nFirst, let\u2019s understand what evaporation is. Evaporation is the process by which water is changed from its liquid state to its gaseous state. This usually occurs at a liquid's surface, like the ocean or a lake, when the water molecules gain enough energy to break away and form water vapor. So in this figure, we can see that the water in the lake and the dam is evaporating and becoming water vapor.\nNow, let\u2019s take a look at evapotranspiration. This is a combination of two processes - evaporation and transpiration. Transpiration is the process by which plants release water vapor through their leaves. So, in this figure, we can see that the trees and plants are releasing water vapor into the air, which is the transpiration part of evapotranspiration. At the same time, the water in the soil and the surface is also evaporating. This combination of evaporation and transpiration is what we call evapotranspiration.\nIn summary, evaporation is the process by which water is changed from its liquid state to its gaseous state, while evapotranspiration is the combination of evaporation and transpiration. Both these processes contribute to the water cycle and are essential for maintaining the balance of water in our environment.",
"capability": [
"rec",
"know",
"gen",
"ocr"
],
"added_in": "v2"
},
"v2_294": {
"question": "What is [person3] doing?v2_294_0.png",
"answer": "carrying a plate of food",
"capability": [
"rec",
"spat",
"ocr",
"know",
"gen"
],
"added_in": "v2"
},
"v2_295": {
"question": "What are [person1] and [person2] doing?v2_295_0.png",
"answer": "walking down the aisle at a wedding ceremony",
"capability": [
"rec",
"spat",
"ocr",
"know",
"gen"
],
"added_in": "v2"
},
"v2_296": {
"question": "Suppose you are a detective, what can you infer from the visual clues in the image?v2_296_0.jpg",
"answer": "From the visual clues in the image, I can infer that:\n- The room belongs to someone who is likely a young adult or teenager, as evidenced by the casual clothing and the desk with a computer.\n- The person is likely a student or works from home, as evidenced by the desk and computer.\n- The person is likely fashion-conscious, as evidenced by the multiple jackets and shoes.\n- The room is likely in a colder climate, as evidenced by the jackets and boots.\n- The person is likely not very tidy, as evidenced by the cluttered desk and the clothes hanging on the door.\n- The room is likely located in an older or more rustic building, as evidenced by the exposed pipes and the worn-looking walls. ",
"capability": [
"rec",
"gen",
"know"
],
"added_in": "v2"
},
"v2_297": {
"question": "What are all the scene text in the image?v2_297_0.png",
"answer": "3,642,039,031,055",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_298": {
"question": "What are all the scene text in the image?v2_298_0.png",
"answer": "- (NVDA)\n- NVIDIA\n- 356.85\n- +51.47\n- +16.85%",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_299": {
"question": "What are all the scene text in the image?v2_299_0.png",
"answer": "- \"Royal\"\n- \"London\" ",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_300": {
"question": "What are all the scene text in the image?v2_300_0.png",
"answer": "The Earth without art is just 'eh'",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_301": {
"question": "What are all the scene text in the image?v2_301_0.jpg",
"answer": "The Road to Hollywood: how some of us got here",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_302": {
"question": "What are all the scene text in the image?v2_302_0.png",
"answer": "- \"Westfield\"\n- \"westfield.com.au\" ",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_303": {
"question": "What are all the scene text in the image?v2_303_0.jpg",
"answer": "-1) \u201cCOVID-19 TESTING\u201d\n-2) \u201cPLEASE HAVE ID & INSURANCE CARD READY\u201d\n-3) \u201cW @UW Medicine\u201d (this is the logo/branding for the University of Washington Medicine",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_304": {
"question": "What are all the scene text in the image?v2_304_0.png",
"answer": "- Vacation\n- Beach\n- Smile\n- Summer\n- Watermelon\n- Flip flops\n- Lemonade",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_305": {
"question": "What are all the scene text in the image?v2_305_0.jpg",
"answer": "- Malayan Tapir\n- Tapirus indicus\n- LOCATION: Malay Peninsula and Sumatra, near water\n- RELATIVES: There are only five species of tapirs. They are most closely related to horses and rhinos.\n- VANISHING? The forest provides tapirs with shelter, food, and water, but forests are rapidly disappearing in Malaysia and Sumatra. ",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_306": {
"question": "What is the value of x in the image?v2_306_0.png",
"answer": "5",
"capability": [
"rec",
"ocr",
"math"
],
"added_in": "v2"
},
"v2_307": {
"question": "Explain the figurev2_307_0.png",
"answer": "This figure represents a flow chart of a team\u2019s proposal process. The process begins with a team member suggesting a project in a meeting. The team then discusses whether it is a good idea or not. If the concept is not considered good, the team rejects it, and the process ends.\nIf the team thinks it might be a good idea but needs more information, a team member conducts further research and refines the concept into a proposal. The team then reviews the proposal and provides feedback. If the proposal is not okay, then the team member revises it and the team reviews it again.\nIf the proposal is okay, the team sends it to a final decision-making process. If the proposal is approved, then the team proceeds with the project. This is the end of the proposal process.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_308": {
"question": "Can you translate the flowchart to a python code?v2_308_0.jpg",
"answer": "num1 = input(\"Enter first number: \") num2 = input(\"Enter second number: \") if num1 > num2: print(num1) else: print(num2)",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_309": {
"question": "Explain the figure.v2_309_0.png",
"answer": "The figure is a graph that shows the relationship between the quality of a paper and its impact on a person's career. The x-axis represents the quality of the paper, which ranges from bad to creative and original. The y-axis represents the paper's impact on a person's career, ranging from nothing to lots of impact.\nThe graph shows that a lousy paper has little to no impact on a person's career, while a creative and original paper has a significant impact. The impact of the paper on a person's career increases as the quality of the paper improves. This suggests that the quality of a person's work is an essential factor in determining their success in their career. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_310": {
"question": "How many families are earning more than 13000 and owns more than 2 cars?v2_310_0.png",
"answer": "113",
"capability": [
"ocr",
"spat",
"math"
],
"added_in": "v2"
},
"v2_311": {
"question": "Describe the image.v2_311_0.png",
"answer": "This image is a floor plan for an apartment or condominium, the layout of the rooms and dimensions: there is a terrace, dining room, fayer, two bedrooms, master bathroom and a guest bathroom. The floor plan is black and white, and is a two-dimensional drawing.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_312": {
"question": "Where is the bathroom for the second bedroom?v2_311_0.png",
"answer": "According to this floor plan, the second bedroom's bathroom appears to be directly adjacent to the bedroom. It is labeled \"WC\" and is a small room measuring 5'2\" x 5'2\".",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_313": {
"question": "Answer the question in the image.v2_313_0.png",
"answer": "```Layer | Number on figure 1\n--- | ---\nOuter core | 3\nMantle | 2\nCrust | 1\nInner core | 4 ```",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_314": {
"question": "Describe the poster. Which city is this dish from?v2_314_0.jpg",
"answer": "The poster promotes a Chinese dish known as \"Hot Dry Noodles.\" The poster features a red background with white Chinese characters at the top that reads \"Hot dry noodles, the taste of China.\" Below the text is a photo of the dish, which includes noodles with meat and vegetables on top. The dish is served in a green bowl with red chili peppers on the side. The text at the bottom of the poster, written in Chinese, describes the dish as spicy, fragrant, and delicious.\nThis particular dish originates from Wuhan, which is located in the Hubei Province of China. It is a famous street food in the city and is considered one of the \"10 Great Breakfasts\" in China.",
"capability": [
"rec",
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_315": {
"question": "This is a paper \"Paper Gestalt.\" Describe the paper in details and highlight their contribution.\nPage 1v2_315_0.pngPage 2v2_315_1.pngPage 3v2_315_2.pngPage 4v2_315_3.pngPage 5v2_315_4.png",
"answer": "The paper \"Paper Gestalt\" is a research paper written by Carven von Bearnensquash from the Department of Computer Science at the University of Phoenix. The paper discusses the visual quality of a computer science research paper and how it affects the overall impression of the paper.\nThe paper begins with an introduction to the concept of paper gestalt, which is the overall impression of a paper. The author argues that the visual quality of a paper is an essential factor in creating a good impression. The paper then discusses previous work in this area. It highlights the contribution of this paper, which is the use of a supervised learning algorithm to evaluate the visual quality of a paper.\nThe paper then presents the methodology and experimental results. The author collected a dataset of 1861 computer science research papers and used a supervised learning algorithm to evaluate the visual quality of the papers. The algorithm was trained on a set of features extracted from the papers, such as the number of figures and the number of equations. The results showed that the algorithm could accurately predict the visual quality of a paper with a high degree of accuracy.\nThe paper concludes with a discussion of the results and future work. The author suggests that future work could focus on improving the algorithm by incorporating more features and training it on a larger dataset. The paper also indicates that the algorithm could be used to evaluate the visual quality of other types of documents, such as technical reports and dissertations.\nOverall, the contribution of this paper is the use of a supervised learning algorithm to evaluate the visual quality of a computer science research paper. This novel approach could help researchers improve the visual quality of their papers and make a better impression on their readers. ",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_316": {
"question": "\u63cf\u8ff0\u9019\u5f35\u5716\u7247v2_316_0.jpg",
"answer": "\u9019\u5f35\u5716\u7247\u662f\u4e00\u96bb\u5c0f\u8c93\u5728\u8349\u5730\u4e0a\u8d70\u8def\u7684\u756b\u9762\u3002\u5c0f\u8c93\u662f\u6a58\u8272\u7684\uff0c\u6709\u85cd\u8272\u7684\u773c\u775b\uff0c\u770b\u8d77\u4f86\u5f88\u53ef\u611b\u3002\u5b83\u7684\u8eab\u9ad4\u5f88\u5c0f\uff0c\u56db\u80a2\u7e96\u7d30\uff0c\u6b63\u5728\u5c0f\u5fc3\u7ffc\u7ffc\u5730\u5728\u8349\u5730\u4e0a\u884c\u8d70\u3002",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_317": {
"question": "D\u00e9crire l\u2019imagev2_316_0.jpg",
"answer": "Il s\u2019agit d\u2019une photo d\u2019un chaton roux marchant sur l\u2019herbe verte. Le chaton a les yeux bleus et semble \u00eatre en train de marcher avec prudence. Il est entour\u00e9 d\u2019herbe et on peut voir une partie d\u2019un autre chat en arri\u00e8re-plan.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_318": {
"question": "Popi\u0161te obr\u00e1zekv2_316_0.jpg",
"answer": "Na obr\u00e1zku je mal\u00e9 oran\u017eov\u00e9 kot\u011b s modr\u00fdma o\u010dima. Kot\u011b stoj\u00ed na zelen\u00e9 tr\u00e1v\u011b a sm\u011b\u0159uje dop\u0159edu. Jeho t\u011blo je v pohybu a vypad\u00e1, \u017ee pr\u00e1v\u011b b\u011b\u017e\u00ed. Na pozad\u00ed je vid\u011bt dal\u0161\u00ed \u010d\u00e1st tr\u00e1vy a nejasn\u011b i dal\u0161\u00ed ko\u010dka. ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_319": {
"question": "Describe the image in Chinesev2_319_0.jpg",
"answer": "\u8fd9\u662f\u4e00\u53ea\u5c0f\u67ef\u57fa\u72ac\uff0c\u5b83\u5728\u8349\u5730\u4e0a\u8d70\u7740\uff0c\u5634\u5df4\u5f20\u5f00\uff0c\u820c\u5934\u4f38\u51fa\u6765\uff0c\u597d\u50cf\u5f88\u5f00\u5fc3\u7684\u6837\u5b50\u3002\u5b83\u7684\u8eab\u4e0a\u6709\u4e00\u6761\u9879\u5708\uff0c\u4e0a\u9762\u6302\u7740\u4e00\u4e2a\u9aa8\u5934\u5f62\u72b6\u7684\u724c\u5b50\u3002",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_320": {
"question": "Describe the image in Frenchv2_319_0.jpg",
"answer": "C'est une image d'un petit chien de race Corgi. Il est de couleur marron et blanc et porte un collier avec une m\u00e9daille en forme d'os. Il est en train de marcher sur l'herbe verte avec la langue pendante.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_321": {
"question": "Describe the image in Czechv2_319_0.jpg",
"answer": "Na obr\u00e1zku je mal\u00fd hn\u011bd\u00fd pes s b\u00edl\u00fdm l\u00edmcem a kosti\u010dkou na obojku. Pes je na zelen\u00e9 tr\u00e1v\u011b a m\u00e1 otev\u0159enou tlamu. Vypad\u00e1, \u017ee se bav\u00ed. ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_322": {
"question": "Describir la imagen en 20 idiomas diferentesv2_322_0.jpg",
"answer": "1. Ingl\u00e9s: This is a beautiful view of Machu Picchu in Peru. \n2. Espa\u00f1ol: Esta es una hermosa vista de Machu Picchu en Per\u00fa.\n3. Franc\u00e9s: C'est une belle vue de Machu Picchu au P\u00e9rou. 4. Alem\u00e1n: Dies ist eine sch\u00f6ne Aussicht auf Machu Picchu in Peru. \n5. Italiano: Questa \u00e8 una bella vista di Machu Picchu in Per\u00f9. \n6. Portugu\u00e9s: Esta \u00e9 uma bela vista de Machu Picchu no Peru. \n7. Ruso: \u042d\u0442\u043e \u043a\u0440\u0430\u0441\u0438\u0432\u044b\u0439 \u0432\u0438\u0434 \u043d\u0430 \u041c\u0430\u0447\u0443-\u041f\u0438\u043a\u0447\u0443 \u0432 \u041f\u0435\u0440\u0443. \n8. Chino: \u8fd9\u662f\u79d8\u9c81\u9a6c\u4e18\u6bd4\u4e18\u7684\u7f8e\u4e3d\u666f\u8272\u3002 \n9. Japon\u00e9s: \u3053\u308c\u306f\u30da\u30eb\u30fc\u306e\u30de\u30c1\u30e5\u30d4\u30c1\u30e5\u306e\u7f8e\u3057\u3044\u666f\u8272\u3067\u3059\u3002 \n10. Coreano: \uc774\uac83\uc740 \ud398\ub8e8\uc758 \ub9c8\ucd94 \ud53c\ucd94\uc758 \uc544\ub984\ub2e4\uc6b4 \uacbd\uce58\uc785\ub2c8\ub2e4. \n11. Hindi: \u092f\u0939 \u092a\u0947\u0930\u0942 \u0915\u0947 \u092e\u093e\u091a\u0942 \u092a\u093f\u091a\u094d\u091a\u0942 \u0915\u093e \u0938\u0941\u0902\u0926\u0930 \u0926\u0943\u0936\u094d\u092f \u0939\u0948\u0964 \n12. \u00c1rabe: \u0647\u0630\u0627 \u0645\u0646\u0638\u0631 \u062c\u0645\u064a\u0644 \u0644\u0645\u0627\u0634\u0648 \u0628\u064a\u062a\u0634\u0648 \u0641\u064a \u0628\u064a\u0631\u0648. \n13. Turco: Bu, Peru'daki Machu Picchu'nun g\u00fczel bir manzaras\u0131d\u0131r. \n14. Griego: \u0391\u03c5\u03c4\u03ae \u03b5\u03af\u03bd\u03b1\u03b9 \u03bc\u03b9\u03b1 \u03cc\u03bc\u03bf\u03c1\u03c6\u03b7 \u03b8\u03ad\u03b1 \u03c4\u03bf\u03c5 \u039c\u03ac\u03c4\u03c3\u03bf\u03c5 \u03a0\u03af\u03c4\u03c3\u03bf\u03c5 \u03c3\u03c4\u03bf \u03a0\u03b5\u03c1\u03bf\u03cd. \n15. Hebreo: \u05d6\u05d4\u05d5 \u05e0\u05d5\u05e3 \u05d9\u05e4\u05d4 \u05e9\u05dc \u05de\u05d0\u05e6'\u05d5 \u05e4\u05d9\u05e6'\u05d5 \u05d1\u05e4\u05e8\u05d5. \n16. 
Sueco: Det h\u00e4r \u00e4r en vacker vy av Machu Picchu i Peru. \n17. Noruego: Dette er en vakker utsikt over Machu Picchu i Peru. \n18. Dan\u00e9s: Dette er en smuk udsigt over Machu Picchu i Peru. \n19. Holand\u00e9s: Dit is een prachtig uitzicht op Machu Picchu in Peru. \n20. Polaco: To pi\u0119kny widok na Machu Picchu w Peru. ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_323": {
"question": "What are all the scene text in the image?v2_323_0.jpg",
"answer": "\u0628\u0633\u0645 \u0627\u0644\u0644\u0647 \u0627\u0644\u0631\u062d\u0645\u0646 \u0627\u0644\u0631\u062d\u064a\u0645",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_324": {
"question": "What are all the scene text in the image?v2_324_0.png",
"answer": "MUSEE DU LOUVRE",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_325": {
"question": "What are all the scene text in the image?v2_325_0.jpg",
"answer": "\u5c16\u6c99\u5480Tsim Sha Tsui",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_326": {
"question": "What are all the scene text in the image?v2_326_0.jpg",
"answer": "WELCOMEbienvenidaBienvenueWillkommenbenvenuto",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_327": {
"question": "What are all the scene text in the image?v2_327_0.jpg",
"answer": "SUPER NINTENDO WORLD\u30b9\u30fc\u30d1\u30fc\u30cb\u30f3\u30c6\u30f3\u30c9\u30fc\u30ef\u30fc\u30eb\u30c9",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_328": {
"question": "What are all the scene text in the image?v2_328_0.png",
"answer": "G.P. FIM DA EUROPAATLETISMOAnt\u00f3nio Agostinho 1987Fernando Domingos 1988",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_329": {
"question": "What are all the scene text in the image?v2_329_0.jpg",
"answer": "\u0391\u0398\u0397\u039d\u0391\u0399-\u03a1\u03a9\u039c\u0397-\u03a1\u0399\u039f\u039d \u0399\u0391\u039d\u0395\u03aa\u03a1\u039f\u039d29 \u039c\u0391\u03aa\u039f\u03a5 1933\u0394\u03a1\u0391\u03a7\u0395\u039b\u039b\u0391\u03a3\u03a3\u03a0\u0391\u0395\u03a1. \u03a4\u0391\u03a7\u03a5\u0394\u03a1. \u03a3\u03a5\u0393\u039a\u039f\u0399\u039d. \u0399\u03a4\u0391\u039b\u0399\u0391\u03a3-\u0395\u039b\u039b\u0391\u0394\u039f\u03a3-\u03a4\u039f\u03a5\u03a1\u039a\u0399\u0391\u03a3120",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_330": {
"question": "What are all the scene text in the image?v2_330_0.jpg",
"answer": "n\u00e3o \u00e9 normal ter medo de andar sozinho na rua!!!",
"capability": [
"ocr"
],
"added_in": "v2"
},
"v2_331": {
"question": "If the image is presented in a language other than English, translate the content to English.v2_331_0.png",
"answer": "The text in the image is in Japanese and translates to \"Good morning, have a nice day.\" ",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_332": {
"question": "If the image is presented in a language other than English, translate the content to English.v2_332_0.png",
"answer": "The text in the image is in Chinese and translates to \"Mapo Tofu.\"",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_333": {
"question": "If the image is presented in a language other than English, translate the content to English.v2_333_0.png",
"answer": "The text in the image is in Korean and translates to \"Delicious food\". ",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_334": {
"question": "If the image is presented in a language other than English, translate the content to English.v2_334_0.png",
"answer": "The text in the image is in Korean and translates to \"ANGELUS\n1st Great Classified Growth\n\nCHATEAU\nANGELUS\n1996\n\nSaint-Emilion Great Growth\nSaint-Emilion Appellation Controlled\"",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_335": {
"question": "If the image is presented in a language other than English, translate the content to English.v2_335_0.png",
"answer": "English translation: \"Pictures [edit | edit wikitext] Stegosaurus's brain was located in its small head.\" ",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_336": {
"question": "If the image is presented in a language other than English, translate the content to English.v2_336_0.png",
"answer": "The content in the image is in Portuguese and translates to \"Double tap to add a title. Double tap to add a subtitle.\" ",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_337": {
"question": "Summarize the info in 20 languages.v2_337_0.png",
"answer": "1. English: The Southern Alps are a mountain range in New Zealand. \n2. Spanish: Los Alpes del Sur son una cadena monta\u00f1osa en Nueva Zelanda. \n3. French: Les Alpes du Sud sont une cha\u00eene de montagnes en Nouvelle-Z\u00e9lande. \n4. German: Die S\u00fcdalpen sind ein Gebirgszug in Neuseeland. \n5. Italian: Le Alpi meridionali sono una catena montuosa in Nuova Zelanda. \n6. Portuguese: Os Alpes do Sul s\u00e3o uma cordilheira na Nova Zel\u00e2ndia. \n7. Russian: \u042e\u0436\u043d\u044b\u0435 \u0410\u043b\u044c\u043f\u044b - \u0433\u043e\u0440\u043d\u044b\u0439 \u0445\u0440\u0435\u0431\u0435\u0442 \u0432 \u041d\u043e\u0432\u043e\u0439 \u0417\u0435\u043b\u0430\u043d\u0434\u0438\u0438. \n8. Chinese: \u5357\u963f\u5c14\u5351\u65af\u5c71\u8109\u662f\u65b0\u897f\u5170\u7684\u4e00\u6761\u5c71\u8109\u3002 \n9. Japanese: \u5357\u30a2\u30eb\u30d7\u30b9\u306f\u30cb\u30e5\u30fc\u30b8\u30fc\u30e9\u30f3\u30c9\u306e\u5c71\u8108\u3067\u3059\u3002 \n10. Korean: \ub0a8\ubd80 \uc54c\ud504\uc2a4\ub294 \ub274\uc9c8\ub79c\ub4dc\uc758 \uc0b0\ub9e5\uc785\ub2c8\ub2e4. \n11. Hindi: \u0926\u0915\u094d\u0937\u093f\u0923\u0940 \u090f\u0932\u094d\u092a\u094d\u0938 \u0928\u094d\u092f\u0942\u091c\u0940\u0932\u0948\u0902\u0921 \u0915\u093e \u090f\u0915 \u092a\u0930\u094d\u0935\u0924 \u0936\u094d\u0930\u0943\u0902\u0916\u0932\u093e \u0939\u0948\u0964 \n12. Bengali: \u09a6\u0995\u09cd\u09b7\u09bf\u09a3 \u0985\u09cd\u09af\u09be\u09b2\u09aa\u09b8 \u09a8\u09bf\u0989\u099c\u09bf\u09b2\u09cd\u09af\u09be\u09a8\u09cd\u09a1\u09c7\u09b0 \u098f\u0987 \u0985\u09a7\u09bf\u0995 \u09aa\u09b0\u09cd\u09ac\u09a4\u09ae\u09be\u09b2\u09be\u0964 \n13. Arabic: \u0627\u0644\u0623\u0644\u0628 \u0627\u0644\u062c\u0646\u0648\u0628\u064a\u0629 \u0647\u064a \u0633\u0644\u0633\u0644\u0629 \u062c\u0628\u0627\u0644 \u0641\u064a \u0646\u064a\u0648\u0632\u064a\u0644\u0646\u062f\u0627. \n14. Turkish: G\u00fcney Alpler Yeni Zelanda'da bir da\u011f silsilesidir. \n15. 
Indonesian: Alpen Selatan adalah sebuah pegunungan di Selandia Baru. \n16. Vietnamese: D\u00e3y n\u00fai Alpes ph\u00eda Nam l\u00e0 m\u1ed9t d\u00e3y n\u00fai \u1edf New Zealand. \n17. Thai: \u0e40\u0e17\u0e37\u0e2d\u0e01\u0e40\u0e02\u0e32\u0e41\u0e2d\u0e25\u0e1b\u0e4c\u0e20\u0e32\u0e04\u0e43\u0e15\u0e49\u0e40\u0e1b\u0e47\u0e19\u0e40\u0e17\u0e37\u0e2d\u0e01\u0e40\u0e02\u0e32\u0e43\u0e19\u0e19\u0e34\u0e27\u0e0b\u0e35\u0e41\u0e25\u0e19\u0e14\u0e4c \n18. Malay: Alpen Selatan adalah satu rangkaian gunung di New Zealand. \n19. Tagalog: Ang Timog Alps ay isang hanay ng mga bundok sa New Zealand. \n20. Swahili: Milima ya Alpi Kusini ni safu ya milima nchini New Zealand.",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_338": {
"question": "Describe the image in both English and the local language corresponding to the geolocation depicted in the image.v2_338_0.png",
"answer": "English: This image shows a couple dressed in traditional Chinese wedding attire, sitting in front of a wall of red roses and a gold Chinese character for \"double happiness.\"\nChinese (Simplified): \u8fd9\u5f20\u56fe\u7247\u5c55\u793a\u4e86\u4e00\u5bf9\u7a7f\u7740\u4e2d\u56fd\u4f20\u7edf\u5a5a\u793c\u670d\u88c5\u7684\u592b\u5987\uff0c\u5750\u5728\u7ea2\u8272\u73ab\u7470\u548c\u91d1\u8272\u201c\u53cc\u559c\u201d\u6c49\u5b57\u524d\u9762\u3002 (Zh\u00e8 zh\u0101ng t\u00fapi\u00e0n zh\u01censh\u00ecle y\u012b du\u00ec chu\u0101nzhe zh\u014dnggu\u00f3 chu\u00e1nt\u01d2ng h\u016bnl\u01d0 f\u00fazhu\u0101ng de f\u016bf\u00f9, zu\u00f2 z\u00e0i h\u00f3ngs\u00e8 m\u00e9igu\u012b h\u00e9 j\u012bns\u00e8 \"shu\u0101ng x\u01d0\" h\u00e0nz\u00ec qi\u00e1nmi\u00e0n.) ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_339": {
"question": "Describe the image in both English and the local language corresponding to the geolocation depicted in the image.v2_339_0.png",
"answer": "English: The image shows a couple wearing traditional Ethiopian clothing, standing in a garden with a tree in the background. The woman is wearing a white dress with colorful patterns and the man is wearing a white suit with similar patterns.\nAmharic (Ethiopia's official language): \u12ed\u1205 \u121d\u1235\u120d \u1260\u12a2\u1275\u12ee\u1335\u12eb\u12ca \u1263\u1205\u120d \u120d\u1265\u1235 \u12e8\u1208\u1260\u1231\u1275 \u1263\u1208\u1264\u1275\u1293 \u1263\u1208\u1264\u1275\u1295 \u1260\u1308\u1263\u122d \u12ed\u1273\u12eb\u120d\u1362 \u1234\u1275\u12ee\u1271 \u1260\u1290\u133b\u1290\u1275 \u12eb\u1209 \u12a0\u1208\u1263\u1208\u1263\u1205\u122d \u120d\u1265\u1236\u127d \u1208\u1260\u1233\u1208\u127d \u12a5\u1293 \u12c8\u1295\u12f5\u12ee\u1271\u121d \u1260\u1218\u1233\u1233\u1205 \u12a0\u1208\u1263\u1208\u1263\u1205\u122d \u1231\u1275 \u1208\u1260\u1233\u1208\u127d\u1362 ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_340": {
"question": "Describe the image in both English and the local language corresponding to the geolocation depicted in the image.v2_340_0.png",
"answer": "English: This image shows a Japanese couple in traditional wedding attire. The man is wearing a black kimono with a white hakama and the woman is wearing a white kimono with a large headpiece.\nJapanese: \u3053\u306e\u753b\u50cf\u306f\u4f1d\u7d71\u7684\u306a\u7d50\u5a5a\u5f0f\u306e\u8863\u88c5\u3092\u7740\u305f\u65e5\u672c\u306e\u30ab\u30c3\u30d7\u30eb\u3092\u793a\u3057\u3066\u3044\u307e\u3059\u3002\u7537\u6027\u306f\u767d\u3044\u88b4\u3068\u9ed2\u3044\u7740\u7269\u3092\u7740\u3066\u304a\u308a\u3001\u5973\u6027\u306f\u5927\u304d\u306a\u982d\u98fe\u308a\u3068\u767d\u3044\u7740\u7269\u3092\u7740\u3066\u3044\u307e\u3059\u3002 (Kono gaz\u014d wa dent\u014d-teki na kekkon-shiki no ish\u014d o kita Nihon no kappuru o shimeshiteimasu. Dansei wa shiroi hakama to kuroi kimono o kite ori, josei wa \u014dkina kazari to shiroi kimono o kiteimasu.) ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_341": {
"question": "Describe the image in both English and the local language corresponding to the geolocation depicted in the image.v2_341_0.png",
"answer": "English: This image shows a newlywed Indian couple sharing a kiss. The bride is wearing a traditional red sari and the groom is wearing a red turban and white suit. They are sitting on a decorated stage with flowers.\nHindi (local language in India): \u092f\u0939 \u091b\u0935\u093f \u090f\u0915 \u0928\u0935\u0935\u093f\u0935\u093e\u0939\u093f\u0924 \u092d\u093e\u0930\u0924\u0940\u092f \u091c\u094b\u0921\u093c\u0947 \u0915\u094b \u090f\u0915 \u091a\u0941\u0902\u092c\u0928 \u0936\u0947\u092f\u0930 \u0915\u0930\u0924\u0947 \u0939\u0941\u090f \u0926\u093f\u0916\u093e\u0924\u0940 \u0939\u0948\u0964 \u0926\u0941\u0932\u094d\u0939\u0928 \u090f\u0915 \u092a\u0930\u0902\u092a\u0930\u093e\u0917\u0924 \u0932\u093e\u0932 \u0938\u093e\u0921\u093c\u0940 \u092a\u0939\u0928 \u0930\u0939\u0940 \u0939\u0948 \u0914\u0930 \u0926\u0942\u0932\u094d\u0939\u093e \u090f\u0915 \u0932\u093e\u0932 \u092a\u0917\u0921\u093c\u0940 \u0914\u0930 \u0938\u092b\u0947\u0926 \u0938\u0942\u091f \u092a\u0939\u0928 \u0930\u0939\u093e \u0939\u0948\u0964 \u0935\u0947 \u092b\u0942\u0932\u094b\u0902 \u0938\u0947 \u0938\u091c\u0947 \u0939\u0941\u090f \u090f\u0915 \u092e\u0902\u091a \u092a\u0930 \u092c\u0948\u0920\u0947 \u0939\u0948\u0902\u0964",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_342": {
"question": "Generate latex codev2_342_0.jpg",
"answer": "$a^2 + b^2 = c^2$",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_343": {
"question": "Generate latex codev2_343_0.jpg",
"answer": "$\\sum_{i=0}^{N} (i^2 + i + 1)^{0.5}$",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_344": {
"question": "Generate latex codev2_344_0.jpg",
"answer": "$y = \\int f(x,y) \\,dx$",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_345": {
"question": "Generate latex codev2_345_0.png",
"answer": "$\\P(x \neq 6) = c \\times 5 \\sum_{i=1}^{N} (i \\times (i + 1)) + y_s \\int_{a}^{b} f(x,y) \\,dx$",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_346": {
"question": "Please read the table in this image and return a markdown-style reconstructed table in text.v2_346_0.png",
"answer": "```| Country | Sales Volume | Revenue | Profit |\n| --- | --- | --- | --- |\n| USA | 40.080 | $15.971.880 | $3.086.421 |\n| China | 35.070 | $15.866.670 | $3.032.162 |\n| Australia | 27.054 | $14.812.566 | $2.868.636 |\n| India | 23.046 | $10.608.174 | $1.853.710 |\n| South Korea | 16.032 | $10.494.948 | $1.975.844 |```",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_347": {
"question": "Please read the table in this image and return a latex-style reconstructed table in text.v2_346_0.png",
"answer": "Here is the reconstructed table in latex:\n```\\begin{tabular},{|c|c|c|c|} \\hline \nCountry & Sales Volume & Revenue & Profit \\\\ \\hline \nUSA & 40.080 & \\$15.971.880 & \\$3.086.421 \\\\ \\hline \nChina & 35.070 & \\$15.866.670 & \\$3.032.162 \\\\ \\hline \nAustralia & 27.054 & \\$14.812.566 & \\$2.868.636 \\\\ \\hline \nIndia & 23.046 & \\$10.608.174 & \\$1.853.710 \\\\ \\hline\nSouth Korea & 16.032 & \\$10.494.948 & \\$1.975.844 \\\\ \\hline\n\\end{tabular}```",
"capability": [
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_348": {
"question": "Generate python code to draw similar curves.v2_348_0.png",
"answer": "``` import matplotlib.pyplot as plt\n import numpy as np\n # Sample data points for the x-axis (number of images in millions)\n x = np.array([1, 10, 100, 1000])\n # Sample data points for the y-axis (CIDEr scores)\n y_base = np.array([50, 70, 85, 100])\n y_large = np.array([60, 80, 100, 120])\n y_huge = np.array([70, 90, 110, 140])\n # Plotting the curves\n plt.figure(figsize=(6, 4))\n plt.plot(x, y_base, 'b-*', label='Base')\n plt.plot(x, y_large, 'r-x', label='Large')\n plt.plot(x, y_huge, 'g-o', label='Huge')\n # Setting the x-axis to be logarithmic\n plt.xscale('log')\n # Adding titles and labels\n plt.title('Model performance as a function of pre-training dataset size')\n plt.xlabel('Million images in pre-training')\n plt.ylabel('CIDEr')\n # Adding a legend\n plt.legend()\n # Adding grid\n # Display the plot\n plt.show()```",
"capability": [
"rec",
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_349": {
"question": "Write python codes to generate similar figures.v2_349_0.png",
"answer": "``` import matplotlib.pyplot as plt\n # Task names and performance scores\n tasks = ['Caption', 'VQA', 'TR', 'IR', 'NLVR2']\n OSCaR_scores = [122, 72, 95, 90, 78]\n OSCaR_proportion = [100, 94, 100, 100, 100]\n MiniVLM_scores = [120, 70, 90, 85, 72]\n MiniVLM_proportion = [97, 96, 95, 95, 94]\n bar_width = 0.35 # width of the bars\n # Set position of bar on X axis\n r1 = np.arange(len(tasks))\n r2 = [x + bar_width for x in r1]\n # Make the plot\n plt.bar(r1, OSCaR_scores, color='blue', width=bar_width, label='OSCaR')\n plt.bar(r2, MiniVLM_scores, color='red', width=bar_width, label='MiniVLM (ours)')\n # Add text on top of the bars\n for i in range(len(tasks)):\n plt.text(r1[i], OSCaR_scores[i] + 3, f'{OSCaR_proportion[i]}%', ha='center', color='black')\n plt.text(r2[i], MiniVLM_scores[i] + 3, f'{MiniVLM_proportion[i]}%', ha='center', color='black')\n # Add xticks on the middle of the group bars\n plt.xlabel('Tasks', fontweight='bold')\n plt.xticks([r + bar_width / 2 for r in range(len(tasks))], tasks)\n # Create legend & Show graphic\n plt.legend()\n plt.show()```",
"capability": [
"rec",
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_350": {
"question": "Generate the following image in tikz.v2_350_0.png",
"answer": "```\\documentclass[tikz,border=10pt]{standalone}\n\\begin{document}\n\\begin{tikzpicture}\n % Body\n \\draw [fill=pink] (0,0) ellipse (3cm and 2cm);\n % Head\n \\draw [fill=pink] (2.5,0.5) circle (1cm);\n % Eyes\n \\draw [fill=white] (2.7,0.7) circle (0.2cm);\n \\draw [fill=black] (2.7,0.7) circle (0.1cm);\n % Nose\n \\draw [fill=pink] (3,0.3) ellipse (0.3cm and 0.2cm);\n \\draw (2.9,0.3) -- (3.1,0.3);\n % Ears\n \\draw [fill=pink] (2.2,1.2) ellipse (0.5cm and 0.3cm);\n \\draw [fill=pink] (3,1.5) ellipse (0.5cm and 0.3cm);\n % Legs\n \\draw [fill=pink] (-1.5,-1.5) circle (0.5cm);\n \\draw [fill=pink] (-0.5,-1.7) circle (0.5cm);\n \\draw [fill=pink] (0.5,-1.7) circle (0.5cm);\n \\draw [fill=pink] (1.5,-1.5) circle (0.5cm);\n % Tail\n \\draw [pink, thick] (1,-1) to [out=90,in=180] (1.5,-0.5) to [out=0,in=180] (2,-1);\n\\end{tikzpicture}\n\\end{document}```",
"capability": [
"rec",
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_351": {
"question": "Describe the pointed region in the image.v2_351_0.png",
"answer": "The pointed region in the image is a green glass bottle of Magna beer with a red label and a gold cap, sitting on a black table surrounded by other items like a water bottle, napkins, and umbrellas.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_352": {
"question": "Describe the pointed region in the image.v2_352_0.png",
"answer": "The pointed region in the image is a green beer bottle with a red label that says \"MAGNA\". The bottle is standing upright on a black table with a white napkin next to it.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_353": {
"question": "Describe the pointed region in the image.v2_353_0.png",
"answer": "The pointed region in the image contains a white folded napkin and a silverware set wrapped in another white napkin placed on a black table. This is likely a table setting for a meal at a restaurant.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_354": {
"question": "Describe the pointed region in the image.v2_354_0.png",
"answer": "The pointed region in the image is a section of a wooden railing with vertical slats, which is located at the edge of a patio overlooking the ocean. The railing appears to be white and is partially obscured.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_355": {
"question": "Describe the two pointed objects in the image.v2_355_0.png",
"answer": "The first pointed object (indicated by the yellow arrow) is a white patio umbrella, which has a pointed top and is attached to a metal pole. The umbrella is open and provides shade for the outdoor seating area. The second pointed object (indicated by the red arrow) is a green glass bottle of Magna beer. The bottle has a pointed neck and is capped with a gold-colored metal lid. It is sitting on a black table in front of a white napkin.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_356": {
"question": "Describe the pointed region in the image.v2_232_0.png",
"answer": "The pointed region in the image is a row of hanging lights on a wire. The lights are small and round and evenly spaced along the wire. The wire is stretched between two poles and above a patio area with tables and umbrellas. The lights appear decorative and are likely used to provide ambient lighting in the evening.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_357": {
"question": "Locate the region based on given coordinates and describe the contents in the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. Describe the relative position of region (0.47, 0.48, 0.55, 0.87) in the image. Describe the contents in that relative position. No need to mention contents in other part of the image.v2_219_0.png",
"answer": "The region (0.47, 0.48, 0.55, 0.87) is located in the center-right part of the image. It covers a small area of the table and extends to the bottom of the image. The most prominent object in this region is a green bottle of Magna beer. A white napkin and a part of a water bottle are also visible in this region. The background shows a part of the patio and the ocean.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_358": {
"question": "Locate the region based on given coordinates and describe the contents in the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. Describe the relative position of region (0.01, 0.09, 0.29, 0.21) in the image. Describe the contents in that relative position. No need to mention contents in other part of the image.v2_219_0.png",
"answer": "The region (0.01, 0.09, 0.29, 0.21) is in the image's top left corner, covering approximately 28% of the width and 12% of the height of the image. In this region, there is a part of a white umbrella and a string of lights. The background shows a clear blue sky and a palm tree.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_359": {
"question": "Locate the region based on given coordinates and describe the contents in the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. Describe the relative position of region (0.01, 0.67, 0.36, 0.91) in the image. Describe the contents in that relative position. No need to mention contents in other part of the image.v2_219_0.png",
"answer": "The region (0.01, 0.67, 0.36, 0.91) in the image is located at the bottom left corner, covering approximately one-third of the width and one-fourth of the height of the image. This region has a black table with a white napkin, a bottle of Magna beer, and a glass bottle of water. The table is in the foreground, while the background shows a part of the patio with white umbrellas and chairs.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_360": {
"question": "Locate the region based on given coordinates and describe the contents in the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. Describe the relative position of region (0.47, 0.48, 0.55, 0.87) in the image. Describe the contents in that relative position. No need to mention contents in other part of the image.v2_232_0.png",
"answer": "The region (0.47, 0.48, 0.55, 0.87) is located towards the right side of the image, slightly below the center. It covers a small portion of the table and the background. In this region, there is a green bottle of Magna beer on the table, with a white napkin next to it. In the background, there is a part of an umbrella and a few chairs.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_361": {
"question": "What is in the circled glass? Object 1 or object 2?\nDescribe what is Object 1 and object 2. Then check what is in the circled glass.v2_234_0.png",
"answer": "Object 1 is a glass bottle of water. It is clear and has a blue label on it.\nObject 2 is a glass bottle of Magna beer. It is green and has a red and white label on it.\nIn the circled glass, it appears to be a clear liquid, likely water. So, it is expected that the contents of the circled glass are from Object 1, the glass bottle of water.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_362": {
"question": "Which circled line shows a different comparison trend? Provide intermediate steps.v2_362_0.png",
"answer": "The circled line that shows a different comparison trend is the USNCO Local Section Exam 2022. Intermediate steps: 1. Analyze the data in the table and look for any discrepancies in the comparison trends. 2. Notice that in all the rows except for the USNCO Local Section Exam 2022, the GPT-4 (no vision) column has a lower score than the GPT-4 column. 3. This means that in all the other rows, the GPT-4 model with vision performed better than the GPT-4 model without vision. 4. However, in the USNCO Local Section Exam 2022 row, the GPT-4 (no vision) column has a higher score than the GPT-4 column. 5. This is a different comparison trend than the rest of the rows, indicating that the GPT-4 model without vision performed better than the GPT-4 model with vision in this exam.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_363": {
"question": "Answer questions in the following figure. Provide intermediate steps.v2_363_0.png",
"answer": "The next image in the sequence would be a star with a dot in the center. This is because the sequence appears to be following a pattern where the shape alternates between a diamond and a star, and a dot is added to the center of the shape every other image. Intermediate steps:\n- First, we can observe that the sequence alternates between a diamond and a star shape.\n- Next, we can see that a dot is added to the center of the shape in every other image.\n- Based on this pattern, we can predict that the next image will be a star with a dot in the center.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_364": {
"question": "What is the icon used for?v2_364_0.png",
"answer": "The circled icon in the image is a microphone icon that is used to activate the voice search feature on Bing : users can click on this icon and speak into their device microphone to ask a question or search for something instead of typing in it. This can be helpful for hands-free searching or for users who may have difficulty typing in.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_365": {
"question": "What does the pointed news talk about?v2_365_0.png",
"answer": "The pointed news is talking about the new feature of ChatGPT that allows users to create personalized instructions that are said to help users manage their conversations better and improve their experience with the chatbot.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_366": {
"question": "What does this part of the poster highlights?v2_366_0.png",
"answer": "This section of the poster presents the ReCo framework, which is the main contribution of this research. It explains the functionality of the framework and the goals it achieves. The ReCo framework is a text-to-image generation model, controlled by regions, that generates high-quality images based on descriptive text. It also describes the different components of the framework and how they interact with each other. The ReCo framework is designed to be flexible and easily extensible, and it has been shown to improve the quality of image generation and achieve better semantic consistency compared to other text-to-image generation techniques.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_367": {
"question": "What are the differences between these two experiments in the slides?v2_367_0.png",
"answer": "There are several key differences between the two experiments shown in the slides:\n1. Tasks: the first experiment (left side) focuses on a visual localization task, i.e., training the model to recognize and localize objects in an image. The second experiment (right side) focuses on the image captioning task, where the model is trained to generate descriptive captions for images. Dataset: the first experiment uses the Flickr30k Entities dataset, which contains images with annotated object bounding boxes. The second experiment uses the MSCOCO and VQA2 datasets, which contain images with relevant captions. Evaluation metrics: The first experiment uses an average accuracy metric to evaluate the performance of the model in a visual grounding task. In summary, these two experiments aim to evaluate the performance of the UniTAB model on different tasks and datasets, and to demonstrate its ability to handle multiple tasks using a single model.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_368": {
"question": "Locate the referred object and represent the location of the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. For example, the (x1,y1,x2,y2) coordinates for that region with the beer bottle is (0.47, 0.48, 0.55, 0.87).v2_219_0.pngFor the image below, what is the (x1,y1,x2,y2) coordinates for the region with the blue Subaru SUV?v2_368_1.png",
"answer": "(0.58, 0.64, 0.88, 0.93)",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_369": {
"question": "Locate the referred object and represent the location of the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. For example, the (x1,y1,x2,y2) coordinates for that region with the beer bottle is (0.47, 0.48, 0.55, 0.87).v2_219_0.pngFor the image below, what is the (x1,y1,x2,y2) coordinates for the region with objectv2_369_1.pngin it?v2_368_1.png",
"answer": "(0.37, 0.65, 0.55, 0.85)",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_370": {
"question": "Explain the images and the action the person is taking.v2_370_0.jpgv2_370_1.jpgv2_370_2.jpgv2_370_3.jpg",
"answer": "The images show a person in a motion capture suit in a studio with multiple cameras and sensors performing a push-up exercise. In the first image the person is in the starting position with his arms extended and their body in a straight line, in the second image the person is lowering their body towards the ground, in the third image the person is at the bottom of the push-up with their chest close to the ground, in the fourth image a person is pushing their body to its starting position.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_371": {
"question": "Analyze the images and decide the correct order in which they should be displayed.\nav2_371_0.jpgbv2_371_1.jpgcv2_371_2.jpgdv2_371_3.jpgev2_371_4.jpg",
"answer": "e,c,b,a,d",
"capability": [
"rec",
"seq"
],
"added_in": "v2"
},
"v2_372": {
"question": "For opening a door, decide the correct order in which they should be displayed.\nav2_372_0.pngbv2_372_1.pngcv2_372_2.png",
"answer": "a,b,c",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_373": {
"question": "For closing a door, decide the correct order in which they should be displayed.\nav2_372_0.pngbv2_372_1.pngcv2_372_2.png",
"answer": "c,b,a",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_374": {
"question": "Predict what will happen next based on the images.v2_374_0.pngv2_374_1.pngv2_374_2.png",
"answer": "Based on the images, it appears that the player in the white jersey is taking a penalty kick ; the next likely event is that the player will kick the ball towards the goal attempting to score ; the goalkeeper in the black jersey will try to block the shot.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_375": {
"question": "Analyze the images and decide what the next steps should be.v2_375_0.jpgv2_375_1.jpgv2_375_2.jpg",
"answer": "The following images depict the process of making sushi rolls. In the first image, rice is mixed with vinegar in a bowl. The second image shows the rice being spread onto a sheet of seaweed. The third image displays the addition of salmon and cucumber to the roll. Afterward, the sushi will need to be rolled using a bamboo mat, cut into smaller pieces, and served with soy sauce and wasabi.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_376": {
"question": "In which frame does the player kick the ball? Did the goalkeeper block the ball?\nav2_374_0.pngbv2_374_1.pngcv2_374_2.pngdv2_376_3.pngev2_376_4.pngfv2_376_5.png",
"answer": "The player kicks the ball in frame c. The ball was not blocked by the goalkeeper, as it can be seen in frame f that the ball is in the net and the goalkeeper is on the ground.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_377": {
"question": "Describe and summarize what the circled person doing?v2_377_0.pngv2_377_1.pngv2_377_2.png",
"answer": "In the first image, we see a man standing next to a bench, seemingly engaged in a conversation with another man who is sitting on the bench. In the second image, the man who was standing is pointing toward something, and in the third image, he appears to be playfully pretending to punch the other man. Overall, it seems like the man standing is having a friendly conversation and joking around with the man sitting on the bench.",
"capability": [
"rec",
"gen",
"seq",
"spat"
],
"added_in": "v2"
},
"v2_378": {
"question": "Summarize the activities of the person.v2_378_0.pngv2_378_1.pngv2_378_2.png",
"answer": "The person sitting on the bench stands up and adjusts their shirt.",
"capability": [
"rec",
"gen",
"seq",
"spat"
],
"added_in": "v2"
},
"v2_379": {
"question": "A tangram is a geometric puzzle that consists of seven flat pieces to form shapes. Here are ten abstract tangram. Which one best illustrates a flying goose? What do other figures look like?\n1.v2_379_0.png2.v2_379_1.png3.v2_379_2.png4.v2_379_3.png5.v2_379_4.png6.v2_379_5.png7.v2_379_6.png8.v2_379_7.png9.v2_379_8.png10.v2_379_9.png",
"answer": "The tangram puzzle has 10 pieces, each representing a different object. Piece number 7 resembles a flying goose with its triangular body and wings, while the smaller triangle on top can be seen as the head and neck. The other pieces can represent the following objects: \n1. Rocket or tower\n2. Butterfly or bat\n3. Question mark or snake\n4. Person or robot\n5. Mountain range or crown\n6. House or temple\n7. Flying goose (as mentioned above)\n8. Bird or fish\n9. Boat or hat\n10. Dog or fox.\nI hope that helps!",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_380": {
"question": "Here is an abstract figure. Can you identify how many characters are there, and the cartoon from which they originate?v2_380_0.png",
"answer": "In this abstract figure, four characters come from the South Park cartoon starring Eric Cartman, Kyle Broflovski, Stan Marsh and Kenny McCormick.",
"capability": [
"rec",
"gen",
"know"
],
"added_in": "v2"
},
"v2_381": {
"question": "A tangram is a geometric puzzle that consists of seven flat pieces to form shapes. Locate the referred object and represent the location of the region. Regions are represented by (x1,y1,x2,y2) coordinates. x1 x2 are the left and right most positions, normalized into 0 to 1, where 0 is the left and 1 is the right. y1 y2 are the top and bottom most positions, normalized into 0 to 1, where 0 is the top and 1 is the bottom. For example, the (x1,y1,x2,y2) coordinates for that region with the beer bottle is (0.47, 0.48, 0.55, 0.87).v2_219_0.pngThe image below that shows a flying goose. Which part represents the head of the bird? What is the (x1,y1,x2,y2) coordinates for the region with the head of the bird?v2_379_6.png",
"answer": "(0.42, 0.15, 0.58, 0.35)",
"capability": [
"rec",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_382": {
"question": "What is the highlighted part?v2_382_0.png",
"answer": "head of the goose",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_383": {
"question": "How are those visual parts related, and can they be combined to form a single object such as a boy? If so, how to arrange them?v2_383_0.pngv2_383_1.pngv2_383_2.png",
"answer": "The three visual components are interrelated in that they can be combined to form a single object, in this case, a boy. To create the boy, we can assemble the parts in the following manner: \n- The first image, the cardboard with orange and green shapes, can be used to make the body of the boy. \n- The second image, the pair of jeans, can be used to form the legs of the boy.\n- The third image, the cardboard with yellow, red, and blue shapes, can be used to create the head of the boy.\n By arranging these components together, we can form a single object that closely resembles a boy.",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_384": {
"question": "Which one of the five is least like the other four?\na.v2_384_0.pngb.v2_384_1.pngc.v2_384_2.pngd.v2_384_3.pnge.v2_384_4.png",
"answer": "d",
"capability": [
"rec",
"seq"
],
"added_in": "v2"
},
"v2_385": {
"question": "Which one of the five designs makes the best comparison?v2_385_0.pnga.v2_385_1.pngb.v2_385_2.pngc.v2_385_3.pngd.v2_385_4.pnge.v2_385_5.png",
"answer": "c",
"capability": [
"rec",
"know",
"seq"
],
"added_in": "v2"
},
"v2_386": {
"question": "Find out the pattern in the first column and use it to infer the missing figure in the second column.v2_386_0.png",
"answer": "upside-down triangle",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v2"
},
"v2_387": {
"question": "Find out the pattern in the first two rows and use it to infer the missing figure in the third row.v2_387_0.png",
"answer": "C",
"capability": [
"rec",
"ocr",
"spat"
],
"added_in": "v2"
},
"v2_388": {
"question": "1.v2_388_0.png2.v2_236_1.png3.v2_388_2.png4.Here are three sub images arranged in a 2-by-2 matrix. Figure out which figure of a to f that should logically replace the missing figure. What would be the next image to complete the matrix?\na.v2_388_3.pngb.v2_236_2.pngc.v2_388_5.pngd.v2_388_6.pnge.v2_388_7.pngf.v2_388_8.pngThe first image in the first column, image 1, is a triangle. The first image in the second column, image 3, is a triangle with a line through it. The second image in the first column, image 2, is a diamond. Therefore, the second image in the second column, image 4 should continue this pattern and be a diamond with a line through it. Option b is the only image that fits this pattern, as it is a diamond with a line through it. Therefore, the correct answer is b.\n1.v2_237_3.png2.v2_237_4.png3.v2_237_5.png4. Here are three sub images arranged in a 2-by-2 matrix. Figure out which figure of a to f that should logically replace the missing figure. What would be the next image to complete the matrix?a.v2_237_6.pngb.v2_237_7.pngc.v2_237_8.pngd.v2_237_9.pnge.v2_237_10.pngf.v2_237_11.png",
"answer": "c",
"capability": [
"rec",
"seq"
],
"added_in": "v2"
},
"v2_389": {
"question": "Identify and read emotions of people from their faces as shown in the image below.v2_389_0.png",
"answer": "sad",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_390": {
"question": "Identify and read emotions of people from their faces as shown in the image below.v2_390_0.png",
"answer": "fearful",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_391": {
"question": "Identify and read emotions of people from their faces as shown in the image below.v2_391_0.png",
"answer": "happy",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_392": {
"question": "Identify and read emotions of people from their faces as shown in the image below.v2_392_0.png",
"answer": "fearful",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_393": {
"question": "After seeing the below image, how people might emotionally feel and react?v2_393_0.jpg",
"answer": "happycontentrelaxed",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_394": {
"question": "After seeing the below image, how people might emotionally feel and react?v2_394_0.jpg",
"answer": "angryfrustratedupset",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_395": {
"question": "After seeing the below image, how people might emotionally feel and react?v2_395_0.jpg",
"answer": "awe",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_396": {
"question": "After seeing the below image, how people might emotionally feel and react?v2_396_0.jpg",
"answer": "scaredanxiousuneasy",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_397": {
"question": "Aesthetics reflects the perceived beauty or visual appeal of an object, design, or piece of art by human.\nAmong the images provided below, based on societal standards and norms, which one more people will consider having a higher aesthetics?v2_397_0.jpgv2_397_1.jpg",
"answer": "second",
"capability": [
"rec",
"seq"
],
"added_in": "v2"
},
"v2_398": {
"question": "Aesthetics reflects the perceived beauty or visual appeal of an object, design, or piece of art by human.\nAmong the images provided below, based on societal standards and norms, which one more people will consider having a higher aesthetics?v2_398_0.jpgv2_398_1.jpg",
"answer": "first",
"capability": [
"rec",
"seq"
],
"added_in": "v2"
},
"v2_399": {
"question": "Describe the image in a humorous way.v2_399_0.jpg",
"answer": "It seems like the sun is attempting to hide behind the horizon, but it's not very successful. It's almost as if it's playing peek-a-boo with us. Meanwhile, the seaweed is just relaxing, as if to say, 'Don't mind us, we're just hanging out.' The rocks are probably feeling a bit neglected, wondering, 'What about us? We're also part of this beach!'",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_400": {
"question": "Describe the image to make people feel uneasy and anxious.v2_400_0.jpg",
"answer": "The image depicts a dimly lit staircase that appears dark and shadowy. The only source of light is a single, dim bulb that casts eerie shadows on the walls. The railing of the staircase is old, rusted, and has peeling paint with jagged edges. The stairs themselves are uneven and make creaking noises when stepped on. The air in the space is thick and musty, and there is a sense of unease as if someone is lurking in the shadows. The silence is deafening, and every creak and groan of the old staircase echoes through the space.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_401": {
"question": "Describe the image to lessen someone's desire to visit.v2_399_0.jpg",
"answer": "The image shows a rocky beach with seaweed and algae covering the ground; the water is murky and there are no clear areas to swim or relax, the rocks are sharp and slippery, making it difficult to walk or explore. The sunset is partially blocked by clouds making it seem like a difficult and unpleasant place to navigate",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_402": {
"question": "Describe the image to make people feel relax and comforting.v2_400_0.jpg",
"answer": "The image is a dimly lit staircase with ornate railings, the light is soft and creates a quiet atmosphere; the shadows on the wall add depth and texture to the image, making it feel cozy and inviting. The overall mood of the image is calm and peaceful, making it a perfect place to relax and unwind.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_403": {
"question": "Compare Image 1 and image 2, tell me about the differences between image 1 and image 2.\nImage 1v2_403_0.pngImage 2v2_403_1.png",
"answer": "1. The crown: in image 1, the crown is pink with a blue gem in the center. In image 2, the crown is gold with red gems and a cross on top.\n2. The dress: in image 1 the dress has a red bow in the center. In image 2, the bow is missing.\n3.The number of cuts: in image 1 the number is 6 while in image 2 the number is 5.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_404": {
"question": "Compare Image 1 and image 2, tell me about 3 differences between image 1 and image 2.\nImage 1v2_404_0.pngImage 2v2_404_1.png",
"answer": "1) In image 1, the color of the coral reef on the right is blue while in Image 2, the color is red. \n2) In image 1, there is a small red coral reef in the middle. In image 2, there is a green plant in the middle. \n3) In image 1, the turtle\u2019s head is facing downwards. In image 2 the turtle\u2019s head is facing upwards.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_405": {
"question": "Compare Image 1 and image 2, tell me about the 3 differences between image 1 and image 2.\nImage 1v2_405_0.pngImage 2v2_405_1.png",
"answer": "1) In image 1, there is no sun in the background, while in image 2, there is a sun in the top left corner.\n2) In image 1, there is a single bamboo leaf on the ground, while in image 2, there is a small brown pile on the ground.\n3) In image 1, the panda is holding three bamboo leaves, while in image 2, the panda is holding a bamboo stalk.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_406": {
"question": "Compare Image 1 and image 2, tell me about 3 differences between image 1 and image 2.\nImage 1v2_406_0.pngImage 2v2_406_1.png",
"answer": "1) Image 1 has spikes on its back while image 2 does not.\n2) Image 2 has a tail while image 1 does not.\n3) Image 2 has eyelashes while image 1 does not.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_407": {
"question": "What is wrong with the object in the image?v2_407_0.png",
"answer": "There is a small hole in the object, which seems to be hazelnut, this could be a sign of insect damage or rot.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_408": {
"question": "What is wrong with the object in the image?v2_408_0.png",
"answer": "There is a tear or hole in the fabric, which is small in size.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_409": {
"question": "What is wrong with the object in the image?v2_409_0.png",
"answer": "The object in the image seems to be a screw or bolt with a damaged or stripped head The grooves in the head that would normally allow a screwdriver or wrench to grip and turn the screw are worn away and no longer work.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_410": {
"question": "What is wrong with the object in the image?v2_410_0.png",
"answer": "It is difficult to tell exactly what the object in the image is, but appears to be a car bumper or fender with a large dent in it, the problem with the object is that it is damaged and dented, which may affect the appearance and function of the car.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_411": {
"question": "What is wrong with the object in the image?v2_411_0.png",
"answer": "It appears that the copper wires in blue and brown sections are frayed and not neatly arranged, which may indicate damage or poor quality.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_412": {
"question": "What is wrong with the object in the image?v2_412_0.png",
"answer": "However, it appears there could be a crack on one of the edges of the object.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_413": {
"question": "What is wrong with the object in the image?v2_413_0.png",
"answer": "There is a small white mark on the orange part of the pill.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_414": {
"question": "What is wrong with the object in the image?v2_414_0.png",
"answer": "There is a small white spot on the lower left side of the inner circle.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_415": {
"question": "What is wrong with the object in the image?v2_415_0.png",
"answer": "Multiple defects can be observed in the image, including dirt on the wheel, damage to the outer edge of the rim, and signs of wear on the tire.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_416": {
"question": "Given Image 1, tell me what is wrong in image 2.\nImage 1v2_416_0.pngImage 2v2_413_0.png",
"answer": "In image 2 there is a small white mark on the orange part of the pill; this could be a defect or damage to the pill.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_417": {
"question": "Given Image 1, tell me what is wrong in image 2.\nImage 1v2_417_0.pngImage 2v2_414_0.png",
"answer": "In image 2 there is a small white spot on the lower left side of the inner circle, which could be a defect or damage on the surface of the object.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_418": {
"question": "Given image 1, tell me if there are any defects seen on the object in image 2?\nImage 1v2_418_0.pngImage 2v2_415_0.png",
"answer": "Yes, there are a few defects seen on the object in image 2:\n\n- There is a significant amount of dirt and grime on the wheel, which is not present in image 1.\n- There appears to be some damage to the outer edge of the rim, which is not present in image 1.\n- The tire tread appears to be more worn in image 2 than in image 1.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_419": {
"question": "How many people are wearing helmets?v2_419_0.png",
"answer": "5",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_420": {
"question": "Please determine whether the person in the image wears a helmet or not. And summarize how many people are wearing helmets.\nImage 1v2_420_0.pngImage 2v2_420_1.pngImage 3v2_420_2.pngImage 4v2_420_3.pngImage 5v2_420_4.pngImage 6v2_420_5.pngImage 7v2_420_6.pngImage 8v2_420_7.png",
"answer": "Image 1: Not wearing a helmet\n Image 2: Not wearing a helmet\n Image 3: Wearing a helmet.\nImage 4: Wearing a helmet.\nImage 5: Wearing a helmet.\nImage 6: Wearing a helmet.\nImage 7: Wearing a helmet.\n Image 8: Not wearing a helmet.\n Summary: Out of the 8 people, 5 are wearing helmets, and 3 are not wearing helmets.",
"capability": [
"rec",
"seq",
"gen"
],
"added_in": "v2"
},
"v2_421": {
"question": "For below image, find what products are presented in the basket. Try to be accuratev2_421_0.png",
"answer": "Smoked hamApplePink tulipsCrab dipStrawberries",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_422": {
"question": "Here is a list of reference images:\nShrimpv2_422_0.pngCrab dipv2_422_1.pngSmoked Hamv2_422_2.pngBananav2_422_3.pngApplev2_422_4.pngBreadv2_422_5.pngCheesev2_422_6.pngStrawberriesv2_422_7.pngPink Tulipsv2_422_8.pngFor below image, find what products are presented in the basket according to reference image above. Only tell me products that are exactly same type of reference images. v2_421_0.png",
"answer": "Smoked hamApplePink tulipsCrab dipStrawberries",
"capability": [
"rec",
"seq"
],
"added_in": "v2"
},
"v2_423": {
"question": "Write a radiology report for this image as an expert radiologist.v2_423_0.png",
"answer": "Radiology Report \n Exam: Abdominal X-ray\n History: The patient presents with abdominal pain and distention.\n Findings: The abdominal X-ray shows a dilated stomach and small bowel loops, indicating a partial small bowel obstruction. There is also a small amount of air present in the rectum. No free intraperitoneal air or pneumoperitoneum is observed. The liver, spleen, and kidneys appear normal.\n Impression: The findings suggest that there is a partial small bowel obstruction. Further imaging studies and clinical correlation are recommended.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_424": {
"question": "Write a radiology report as an expert radiologist for the following case.v2_424_0.png",
"answer": "An MRI of the right knee has revealed a significant build-up of fluid in the joint, which is most noticeable in the suprapatellar region. The scan also detected evidence of a tear in the medial meniscus and mild degenerative changes in the articular cartilage. However, the anterior cruciate ligament, posterior cruciate ligament, and extensor mechanism are all intact, and no other significant abnormalities were observed. In summary, this indicates there is a large joint effusion and a medial meniscal tear in the right knee, with mild degenerative changes present in the articular cartilage.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_425": {
"question": "Write a radiology report as an expert radiologist for the following case:\nCase:\nA 32-year-old woman presented with a complaint of pain in her right wrist. The patient reported that she fell on her outstretched hand while playing basketball. An X-ray of the right wrist was performed.v2_425_0.png",
"answer": "Radiology Report:\nExam: X-ray of the right wrist\nIndication: Right wrist pain after falling on outstretched hand while playing basketball\nFindings: There is a transverse fracture of the distal radius with mild dorsal angulation. No other fractures or dislocations are seen. The carpal bones are in normal alignment. No significant soft tissue swelling is noted.\nImpression: Transverse fracture of the distal radius with mild dorsal angulation. No other fractures or dislocations are seen.\nRecommendation: Orthopedic consultation for management of the fracture.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_426": {
"question": "Write a radiology report for this image as an expert radiologist.v2_426_0.png",
"answer": "Report:\nExam: X-ray of the right hand and wrist\nTechnique: AP and lateral views were obtained\nFindings: The bones of the right hand and wrist appear intact and in proper alignment. There is an obvious distal radial fracture.\nThe joint spaces are preserved and there is no evidence of degenerative changes. No soft tissue abnormalities are seen.\nImpression: Normal X-ray of the right hand and wrist.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_427": {
"question": "Write a radiology report for this image as an expert radiologist.v2_427_0.png",
"answer": "Report:\nStudy Type: Chest CT\nSubject: 42-year-old male\nFindings: The chest CT images demonstrate a nodular opacity in the left upper lobe, measuring approximately 1.3 cm in diameter. The opacity appears to have spiculated margins and is located adjacent to the pleura. There is no evidence of mediastinal or hilar lymphadenopathy.\nImpression: The findings are concerning for a primary lung malignancy. Further evaluation with a biopsy is recommended to confirm the diagnosis. ",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_428": {
"question": "Write a radiology report as an expert radiologist for the following case.v2_428_0.png",
"answer": "Report:\nModality: Magnetic Resonance Imaging (MRI)\nBody Part: Brain\nTechnique: Axial T1-weighted\nFindings: The MRI of the brain demonstrates a large intra-axial mass in the left parietal lobe with surrounding edema. The mass appears to be heterogeneous in signal intensity with areas of high and low signal intensity. There is a significant mass effect with midline shift to the right. The ventricles appear to be compressed and there is evidence of hydrocephalus. No other significant abnormalities are noted.\nImpression: Large intra-axial mass in the left parietal lobe with surrounding edema and significant mass effect. Likely high-grade glioma. Further imaging and clinical correlation are recommended.",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_429": {
"question": "The first image is a chest x-ray scan the patient took last time. The previous diagnoses mention pleural effusion.v2_429_0.pngv2_429_1.png",
"answer": "Radiology Report\nExam: Chest X-ray\nFindings: The chest x-ray scan taken this time shows a significant improvement in the patient's condition compared to the previous scan. The previous scan showed a pleural effusion, which is a buildup of fluid in the space between the lungs and chest wall. However, the current scan shows that the pleural effusion has resolved. There is no evidence of any new abnormalities in the lungs or chest wall. The lungs appear to be well-expanded and the heart size is normal. The mediastinum, which is the space between the lungs, is also within normal limits.\nConclusion: The patient's condition has improved since the last chest x-ray scan, with resolution of the previously noted pleural effusion. No new abnormalities are seen.",
"capability": [
"rec",
"know",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_430": {
"question": "The first image is a chest x-ray scan the patient took last time. The previous diagnoses mention pleural effusion.v2_430_0.pngv2_430_1.png",
"answer": "Radiology Report\nExam: Chest X-ray\nFindings: The chest x-ray scan taken this time shows a significant worsening of the patient's pleural effusion. The fluid accumulation in the pleural space is more prominent than in the previous scan. The lung fields are also more hazy and congested, indicating a possible infection or inflammation. The heart and mediastinal contours are obscured by the fluid, making it difficult to assess their size and shape. \nImpression: The patient's pleural effusion has worsened, and there is a possibility of an underlying infection or inflammation. Further evaluation and management are recommended.",
"capability": [
"rec",
"know",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_431": {
"question": "Imagine that you are an expert in evaluating the car damage from car accident for auto insurance reporting. Please evaluate the damage seen in the image below.v2_431_0.png",
"answer": "From the pictures, the car appears to have damage to the front passenger side bumper. The damage appears to be in the form of scuffs and scratches, and in some areas the paint has peeled off. The damage appears to be cosmetic only and does not affect the bumper or the structural integrity of the car. However, it should be noted that the pictures only show one angle of the car and do not provide a full picture of the damage. A more thorough inspection of the car is needed to fully assess the extent of the damage and determine if there are any underlying issues that are not visible in the pictures.",
"capability": [
"rec",
"gen",
"know"
],
"added_in": "v2"
},
"v2_432": {
"question": "Imagine that you are an expert in evaluating the car damage from car accident for auto insurance reporting. Please evaluate the damage seen in the image below.v2_432_0.png",
"answer": "Based on the image, it seems that the front part of the vehicle has suffered significant damage. The hood is crumpled, and the front bumper is partially detached. It appears that the headlights are also damaged. It is likely that the vehicle was involved in a collision from the front. Although the damage seems to be mainly cosmetic, there may be underlying structural damage to the frame or engine. A thorough inspection would be necessary to assess the complete extent of the damage. As far as repair costs are concerned, the hood and bumper would most likely need to be replaced, and the headlights may need to be repaired or replaced as well. The repair costs would depend on the make and model of the vehicle, but they would probably amount to several thousand dollars, at the very least.",
"capability": [
"rec",
"gen",
"know"
],
"added_in": "v2"
},
"v2_433": {
"question": "Imagine that you are an expert in evaluating the car damage from car accident for auto insurance reporting. Please evaluate the damage seen in the image below.v2_433_0.png",
"answer": "Based on the image, it seems that the car has suffered damage to the rear bumper and quarter panel on the driver's side. The bumper appears to be dented and scratched, while the quarter panel has a significant dent and some scuff marks. It is likely that the car was hit from the side, causing damage to both the bumper and the quarter panel. As for the cost of repair, the bumper may be repairable with some minor body work and repainting. However, the quarter panel may require more extensive repairs, or even replacement, which could be more expensive. All in all, I would estimate the damage to be moderate to severe, with repair costs likely to run into the thousands of dollars.",
"capability": [
"rec",
"gen",
"know"
],
"added_in": "v2"
},
"v2_434": {
"question": "Imagine that you are an expert in evaluating the car damage from car accident for auto insurance reporting. Please evaluate the damage seen in the image below v2_434_0.png",
"answer": "Based on the image, it seems that the vehicle has suffered severe damage to the front end. The hood is crumpled, and the front bumper is entirely detached from the vehicle. The headlights and grille are also damaged, and the engine appears to be exposed. Furthermore, there is damage to the driver's side fender and door. Considering the extent of the damage, it is likely that the vehicle was involved in either a high-speed or head-on collision. The cost of repairs for this vehicle will probably be substantial, and the insurance company may consider it a total loss.",
"capability": [
"rec",
"gen",
"know"
],
"added_in": "v2"
},
"v2_435": {
"question": "Imagine that you are an expert in evaluating the car damage from car accident for auto insurance reporting. Please fill the incident report for the accident shown in image below, with the following format in JSON (note xxx is placeholder, if you cannot determine that based on the image, put \"N/A\" instead).\n{\"make\": xxx, \"model\": xxx, \"license plate\": xxx, \"damage description\": xxx, \"estimated cost of repair\": xxx}v2_435_0.png",
"answer": "{\"make\": \"Maruti Suzuki\", \"model\": \"Celerio\", \"license plate\": \"KL 52 N 5305\", \"damage description\": \"Front bumper, hood, and windshield damaged. Airbags deployed.\", \"estimated cost of repair\": \"N/A\"}",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v2"
},
"v2_436": {
"question": "Imagine that you are an expert in evaluating the car damage from car accident for auto insurance reporting. Please evaluate the damage seen in the image below. For filing the incident report, please follow the following format in JSON (note xxx is placeholder, if the information is not available in the image, put \"N/A\" instead).\n{\"make\": xxx, \"model\": xxx, \"license plate\": xxx, \"damage description\": xxx, \"estimated cost of repair\": xxx}v2_436_0.png",
"answer": "{\"make\": \"Toyota\", \"model\": \"Corolla\", \"license plate\": \"6G7B414\", \"damage description\": \"Front bumper and hood damage, driver side fender damage, driver side headlight damage\", \"estimated cost of repair\": \"$2,500-$3,500\"} ",
"capability": [
"rec",
"ocr",
"know",
"gen"
],
"added_in": "v2"
},
"v2_437": {
"question": "Here are the photos of my family members.\nLindav2_437_0.pngCottonv2_437_1.pngMaxv2_437_2.pngSamv2_437_3.pngEmmav2_437_4.pngPlease describe the image with as many details as possible, using my family members\u2019 names.v2_437_5.png",
"answer": "This is a family portrait of Linda, her children Emma and Sam, and their pets, Max the dog and Cotton the cat. The family is sitting in their living room, with Linda on the couch and Emma and Sam on the floor. Max is sitting between Linda and Emma, with his tongue sticking out, while Cotton is perched on Linda's shoulder. All family members are smiling and looking at the camera. The room is bright and airy, with a vase of yellow flowers on the coffee table and a white bookshelf in the background.",
"capability": [
"rec",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_438": {
"question": "Here are the photos of my family members.\nLindav2_437_0.pngCottonv2_437_1.pngMaxv2_437_2.pngSamv2_437_3.pngEmmav2_437_4.pngPlease describe the image with as many details as possible, using my family members\u2019 names.v2_438_5.png",
"answer": "In this image, you can see three members of my family: my brother Sam, our dog Max, and myself, Emma. We are lying on a grassy field under a clear blue sky. Sam and I are resting our heads on our hands, smiling at the camera, while Max is lying between us with his tongue out. We are all enjoying the beautiful weather and spending quality time together as a family.",
"capability": [
"rec",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_439": {
"question": "Describe the objects below with as many details as possible, Reference to the content shown in the context image but focus on describing each object below.\nObject 1v2_439_0.pngObject 2v2_439_1.pngObject 3v2_439_2.pngObject 4v2_439_3.pngContext imagev2_439_4.png",
"answer": "Object 1 is a close-up of a snail's shell. The shell is light beige with a spiral pattern on the top. It appears slightly weathered, with small chips and cracks visible on the edges. The background is white, making the shell the main focus of the image. It is angled slightly with the spiral pattern facing towards the right side of the image. \n Object 2 is a close-up of a snail. The snail has a light orange shell with a spiral pattern. Its body is darker orange with small bumps on the skin. The snail's head is extended forward and its antennae are visible. The background is white, making the snail the main focus of the image.\n Object 3 shows a close-up of a frog with a snail on its head. The frog is light green with a pinkish hue on its underside. It has large black and white bulging eyes. The snail is orange and perched on top of the frog's head. The frog is sitting on a rock or flat surface with its legs tucked underneath. The background is white, making the frog and snail stand out.\n Object 4 is a close-up of a turtle's head and neck, with its body partially visible. The turtle appears to be floating in water, with its head and neck extended upwards. Its skin is green, and its shell is grey with black stripes. The shell appears to be damaged, with a large chunk missing from the top. The turtle's eyes are closed, and its mouth is slightly open.",
"capability": [
"rec",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_440": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \"a parrot driving a car\"?v2_440_0.png",
"answer": "On a scale of 1 to 10, I would have this image a 1 in similarity to the text prompt \"a parrot driving a car\" as there is no parrot or car present in the image.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_441": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \"a parrot driving a car\"?v2_441_0.png",
"answer": "The image depicts a parrot soaring in the sky with trees and clouds visible in the background. Based on the text prompt \"a parrot driving a car\", I would rate this image a 2 in terms of similarity. Although a parrot is present in the image, it is not seen driving a car.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_442": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \"a parrot driving a car\"?v2_442_0.png",
"answer": "In the image there is a parrot perched on a car; it is not driving the car, but it is seated on the car. I would rate this image a 4 in terms of similarity to the text prompt \"a parrot driving a car\" because there is a parrot and a car present but the parrot is not driving the car.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_443": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \"a parrot driving a car\"?v2_443_0.png",
"answer": "In this image, a parrot's head is superimposed onto a moving car on the road, with the parrot appearing to be the driver. Although the parrot's body is not visible, the image clearly depicts a parrot in the driver's seat. However, the car itself is not very clear and seems to be a blurred image. On a scale of 1 to 10, I would give this image an 8 in terms of how well it matches the text prompt \"a parrot driving a car\".",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_444": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \"a parrot driving a car\"?v2_444_0.png",
"answer": "In this image, there are two parrots perched on top of a car - one red and one yellow. The yellow parrot is holding the steering wheel and appears to be driving the car. If we were to rate this image on a scale of 1 to 10, with 10 being the most similar to the text prompt \"a parrot driving a car\", I would give it a rating of 9. The only reason it falls short of a perfect 10 is that there are two parrots in the image, whereas the prompt suggests only one.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_445": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \u201ca cake on the table with word \u201cAzure Research\u201d written on it\"?v2_445_0.png",
"answer": "In the image, there is a cake on a table with the words \"Azuze Research\" written on it. I would rate this image an 8 out of 10 in similarity to the text prompt \"a cake on the table with word 'Azure Research' written on it\" because the only difference is the misspelling of \"Azure\" as \"Azuze.\" ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_446": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \u201ca cake on the table with word \u201cAzure Research\u201d written on it\"?v2_446_0.png",
"answer": "In the image, there is a blue cake on a table with the word \"ARAUIE\" written on it. On a scale of 1 to 10, I would rate this image a 6 in terms of similarity to the text prompt \"a cake on the table with word 'Azure Research' written on it\". \nThe image does show a cake on a table, but the word written on the cake is not an exact match to the text prompt. The color of the cake is also blue, which could be seen as similar to the word \"Azure\" in the prompt. ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_447": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \u201ca cake on the table with word \u201cAzure Research\u201d written on it\"?v2_447_0.png",
"answer": "In the image, there is a cake on a table with the words \"Azure Aurre\" written on it. I would rate this image an 8 out of 10 in similarity to the text prompt \"a cake on the table with word 'Azure Research' written on it\" because the image does show a cake on a table with the word \"Azure\" written on it, but the word \"Research\" is not present. ",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_448": {
"question": "What is happening in the image? From scale 1 to 10, decide how similar the image is to the text prompt \u201ca cake on the table with word \u201cAzure Research\u201d written on it\"?v2_448_0.png",
"answer": "In the image, there is a two-tiered cake on a table with the words \"Azure Research\" in blue icing. I would rate this image a 9 out of 10 in terms of similarity to the text prompt as it very closely matches the description I gave it a 10 because the text prompt does not mention the two layers or the additional decorations on the cake.",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_449": {
"question": "This is the original image:v2_449_0.pngI want to make this image look like graphic novel cover. The prompt should be a single sentence in less than 15 words with descriptive words. For example: \u201chave it look like a graphic novel\u201d.\nBased on the above prompt examples and the original image, help me to write a better prompt to an image editing model. ",
"answer": "\"Transform this image of a statue into a dramatic graphic novel cover with a dark tone.\"",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_450": {
"question": "This is the original image:v2_449_0.pngThe prompt I used to edit this image is \u201chave it look like a graphic novel\u201d.\nThe edited image I got is:v2_450_1.pngTell me how I should change my prompt to make the edited image better.",
"answer": "Instead of using the prompt \u201chave it look like a graphic novel\u201d you could try being more specific with the prompt to guide AI in the direction you want the image to go. For example, you could use prompts such as \u201cMake the image look like a black and white comic book illustration\u201d or \u201cAdd bold lines and high contrast to the image to make it look like a graphic novel cover\u201d. This could help the AI better understand the aesthetic you are going for and produce a more refined edited image.",
"capability": [
"rec",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_451": {
"question": "First, read the operating menu below for coffee machine buttons.\nMenu:v2_451_0.pngNow, let's look at the operating panel of the coffee machine in the image below, which button should I use for a 8 OZ coffee: left, right, top or bottom button?v2_451_1.png",
"answer": "You should use the bottom button for an 8 OZ coffee. According to the menu, the bottom button corresponds to a 8 OZ coffee, while the top button is for a switch button and the right button is for a 10 OZ coffee.",
"capability": [
"rec",
"ocr",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_452": {
"question": "First, read the operating menus below for coffee machine buttons.\nMenu 1:v2_452_0.pngMenu 2:v2_452_1.pngMenu 3:v2_452_2.pngNow, let's look at the operating panel of the coffee machine in the image below, which button should I use for a 6 OZ coffee: left, right, top or bottom button?v2_451_1.png",
"answer": "Use the left button to get a 6 OZ coffee.",
"capability": [
"rec",
"ocr",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_453": {
"question": "Imagine that you are a home robot, and is asked to go to the kitchen to fetch something from the fridge.\nThe image below shows your current position. Please plan your next action.v2_453_0.png",
"answer": "My next action would be to turn left and move towards the hallway as I see that the kitchen is likely located in this direction and then continue to navigate through the hallway until I reach the kitchen and locate the fridge.",
"capability": [
"rec",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_454": {
"question": "Imagine that you are a home robot, and is asked to go to the kitchen to fetch something from the fridge.\nAt the previous turn, you were at the position shown in the below image:v2_453_0.pngThe action taken in previous turn is: turn right and move forward towards the hallway.\nNow you are at the hallway, this is what you can see from there. Can you see the kitchen from here? What is your next action?v2_454_1.png",
"answer": "I can see the kitchen from my current position on the right side of the room. My next action would be to turn right and move towards the kitchen.",
"capability": [
"rec",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_455": {
"question": "Imagine that you are a home robot, and is asked to go to the kitchen to fetch something from the fridge.\nAt the previous turn, you were at the position shown in the below image:v2_454_1.pngThe action taken in previous turn is: turn right and move forward towards the kitchen.\nNow you are at the kitchen, this is what you can see from there. Can you see the fridge from here? What is your next action?v2_455_1.png",
"answer": "From this position, I can see the fridge on the right side of the kitchen. My next action would be to move forward and turn gently to the right to approach the refrigerator.",
"capability": [
"rec",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_456": {
"question": "Imagine that you are a home robot, and is asked to go to the kitchen to fetch something from the fridge.\nAt the previous turn, you were at the position shown in the below image:v2_455_1.pngThe action taken in previous turn is: move forward and turn slightly to the right to approach the fridge.\nNow this is what you can see from there. What is your next action?v2_456_1.png",
"answer": "The next step would be to move forward and slightly to the left to align with the fridge door and then use my robotic arm to open the fridge door and retrieve the item being requested.",
"capability": [
"rec",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_457": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard.\nYou are asked to find a detailed recipe of Mapo Tofu.\nBelow is what you see on the computer screen, predict your next move. If the action involves moving the mouse, describe the location as detailed as possible.v2_457_0.png",
"answer": "Next move : I would move the mouse to the Google Chrome icon on the left side of the screen, approximately 1/3 of the way down from the top and then click the icon to open the web browser.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_458": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find a detailed recipe of Mapo Tofu.\nPrevious action: \"I would move the mouse to the Google Chrome icon located on the left side of the screen, approximately 1/3 of the way down from the top. I would then click on the icon to open the web browser. \"\nYou have now opened the web browser. Below is what you see on the computer screen. What will you do next? If the action involves moving the mouse, describe the location as detailed as possible.v2_458_0.png",
"answer": "Next, I would move the mouse to the search bar, which is located in the center of the screen and positioned approximately halfway down from the top. Then, I would click on the search bar and type \"Mapo Tofu recipe\" using the keyboard. Once I have typed in the search query, I would press the \"Enter\" key on the keyboard to initiate the search.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_459": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find a detailed recipe of Mapo Tofu.\nPrevious action: \" I would move the mouse to the search bar located in the center of the screen, approximately 1/2 of the way down from the top. I would then click on the search bar and type in \"Mapo Tofu recipe\" using the keyboard. After typing in the search query, I would press the \"Enter\" key on the keyboard to initiate the search.\"\nYou have now completed the previous action as described above. Below is what you see on the computer screen. What will you do next? If the action involves moving the mouse, describe the location as detailed as possible.v2_459_0.png",
"answer": "Next action would be to put the mouse forwards to the first search result under the \"Recipes\" section, which is called \"Mapo Tofu Recipe - The Woks of Life\", then click on the link to open the website and view the detailed recipe.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_460": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find a detailed recipe of Mapo Tofu.\nPrevious action: \u201cI would move the mouse to the first search result under the \"Recipes\" section, which is titled \"Mapo Tofu Recipe - The Woks of Life\". I would then click on the link to open the webpage and view the detailed recipe.\"\nYou have now completed the previous action as described above. Below is what you see on the computer screen. Based on the image below, what will you do next? If the action involves moving the mouse, describe the location as detailed as possible.v2_460_0.png",
"answer": "Next action: \"I would move the mouse to the \"Jump to Recipe\" button in the top right corner of the webpage then click on the button to jump to the detailed recipe section of the page.\"",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_461": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find a detailed recipe of Mapo Tofu.\nPrevious action: \u201cI would move the mouse to the \"Jump to Recipe\" button located at the top right corner of the webpage. I would then click on the button to jump to the detailed recipe section of the page.\"\nYou have now completed the previous action as described above. Below is what you see on the computer screen. Based on the image below, what will you do next? If the action involves moving the mouse, describe the location as detailed as possible.v2_461_0.png",
"answer": "Next action: \"I would move the mouse to the \"Print Recipe\" button located in the top right corner of the Recipe section next to the button \"Rate This Recipe\" and then click on the button to print a copy of the detailed recipe for Mapo Tofu \"",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_462": {
"question": "Describe the image below as detailed as possible.v2_462_0.png",
"answer": "The image is a recipe for Mapo Tofu, a Chinese dish. The recipe is presented in a structured format with a title, description, prep time, cook time, total time, course, cuisine, servings, and rating. \nThe title of the recipe is \"Mapo Tofu\" and it is written in bold black letters. Below the title, there is a description of the dish which states that it is the true blue, authentic real deal - the spicy, tongue-numbing, rice-is-absolutely-not-optional Mapo Tofu that you get in the restaurants. \nThe prep time for the dish is 10 minutes, the cook time is 25 minutes, and the total time is 35 minutes. The course is listed as \"Main Course\" and the cuisine is \"Chinese\". The recipe serves 6 people and has a rating of 4.89 stars out of 5.\nBelow this information, there is a list of ingredients required for the dish, including tofu, ground pork, Sichuan peppercorn, garlic, ginger, soy sauce, and cornstarch. The ingredients are listed in a bullet point format.\nAt the bottom of the image, there is nutritional information for the dish, including calories, carbohydrates, protein, fat, saturated fat, cholesterol, sodium, and calcium. The nutritional information is presented in a table format.\nThe image also includes a credit to the author of the recipe, Kaitlin, and a link to the original recipe on the website \"The Woks of Life\". ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_463": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard.\nYou are asked to find what\u2019s in the news today.\nBelow is what you see on the computer screen, predict your next move. If the action involves moving the mouse, describe the location as detailed as possible.v2_457_0.png",
"answer": "My next move would be to move the mouse to the Google Chrome icon on the left side of the screen, about 1/3 of the way down from the top, then click the icon to open the web browser and search for news sites to find out what's in the news today.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_464": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find what\u2019s in the news today.\nPrevious action: \"My next move would be to move the mouse to the Google Chrome icon located on the left side of the screen, approximately 1/3 of the way down from the top. I would then click on the icon to open the web browser and search for news websites to find out what's in the news today. \"\nYou have now opened the web browser. Below is what you see on the computer screen, what is your immediate next step? If the action involves moving the mouse, describe the location as detailed as possible.v2_458_0.png",
"answer": "The next step would be to move the mouse to the search bar located in the center of the screen, about 1/2 the way down from the top, then I would click the search bar and type in \"news\" and press the enter key on the keyboard to search for news sites.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_465": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find what\u2019s in the news today.\nPrevious action: \"My immediate next step would be to move the mouse to the search bar located in the center of the screen, approximately 1/2 of the way down from the top. I would then click on the search bar and type in \"news\" and press the enter key on the keyboard to search for news websites. \"\nYou have now completed the previous action. Below is what you see on the computer screen. Based on the image below, what is your immediate next step? If the action involves moving the mouse, describe the location as detailed as possible.v2_465_0.png",
"answer": "My immediate next step would be to move the mouse to the first search result which is \"State Department doubles down on Zelensky Slams\" located around 1/4 of the way down the screen and 1/8 of the way from the left side of the screen. I would then click on the link to open the news article and read about what is in the news today.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_466": {
"question": "Read the article shown in the images below and summarize it.v2_466_0.pngv2_466_1.png",
"answer": "The article discusses Ukrainian President Volodymyr Zelensky's statement made on Tuesday expressing his country's desire to join NATO. Zelensky explained that Ukraine cannot afford to go to war with Russia and that joining NATO would provide the necessary security and protection. However, Matthew Miller, a spokesperson for NATO, stated that Ukraine must meet certain conditions such as democratic and security-sector reforms before the alliance can extend an invitation to join. Miller also emphasized that Ukraine's entry into NATO is not guaranteed and that the decision ultimately lies with the members of the alliance. During a press conference on Tuesday, Zelensky reiterated his commitment to strengthening democracy in Ukraine, which is a necessary condition for NATO membership.",
"capability": [
"rec",
"ocr",
"gen",
"spat",
"seq"
],
"added_in": "v2"
},
"v2_467": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find what\u2019s in the news today.\nPrevious action: \"My immediate next step would be to move the mouse to the first search result, which is \"State Department doubles down on Zelensky slams\" located approximately 1/4 of the way down from the top of the screen and 1/8 of the way from the left side of the screen. I would then click on the link to open the news article and read about what's in the news today.\"\nYou have now completed reading \u201cState Department doubles down on Zelensky slams\u201d. What is your immediate next step? If the action involves moving the mouse, describe the location as detailed as possible.v2_467_0.png",
"answer": "My immediate next step would be to move the mouse to the top right corner of the screen, where I can see the \"X\" icon to close the current tab. I would then click on the \"X\" icon to close the tab and return to the previous page to continue browsing for more news articles. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_468": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nYou are asked to find what\u2019s in the news today.\nPrevious action: \"My immediate next step would be to move the mouse to the top right corner of the screen, where I can see the \"X\" icon to close the current tab. I would then click on the \"X\" icon to close the tab and return to the previous page to continue browsing for more news articles. \"\nYou have now returned to the previous page after reading the first article \u201cState Department doubles down on Zelensky slams\u201d. Below is what you see on the computer screen. Based on the image below, what is your immediate next step? If the action involves moving the mouse, describe the location as detailed as possible.v2_465_0.png",
"answer": "My immediate next step would be to move the mouse to the second article on the page, \"Catastrophic flooding swamps Florida Panhandle as intense storms force evacuations\". I would move the mouse to the left side of the article title approximately 1/3 of the way down the page, and click on the article title to open it and read the news.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_469": {
"question": "Read the article shown in the images below and summarize it.v2_469_0.pngv2_469_1.pngv2_469_2.pngv2_469_3.pngv2_469_4.pngv2_469_5.pngv2_469_6.png",
"answer": "The article discusses the catastrophic flooding that occurred on Tuesday, July 11, 2023 in Montpelier, the capital of Vermont. The flooding was caused by intense rainstorms that inundated the northeast, leading to evacuations and closures in the area. Vermont Governor Phil Scott declared a state of emergency, and the state of New Hampshire sent rescuers and Blackhawk helicopters to assist in the relief effort. The flooding caused significant damage to homes and businesses, and some residents were forced to evacuate. In Oklahoma City, two children, ages 10 and 11, were rescued from a reservoir after being swept away by floodwaters. In New York, Hurricane Irene caused 8 inches of rain in 24 hours, resulting in severe infrastructure damage. The article concludes with a quote from Dan Hancock, a resident of Chester, Vermont, who watched floodwaters pour into the basement of his home. He expresses his frustration and helplessness, saying, \"Once the water goes down, we go back, clean it up, and move on. What can we do?",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_470": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard.\nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nBelow is what you see on the phone screen, predict your next move. If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_470_0.png",
"answer": "My next move would be to move my finger to the Amazon icon, which is located in the third row and fourth column of the screen. I would then click on the icon to open the app and search for an ergonomic keyboard within my budget between $50 and $100. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_471": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard.\nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \"My next move would be to move my finger to the Amazon icon, which is located in the third row and third column of the screen. I would then click on the icon to open the app and search for an ergonomic keyboard within my budget of $50. \"\nYou have now opened the Amazon app. Below is what you see on the phone screen. What will you do next? If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_471_0.png",
"answer": "My next move would be to move my finger to the search bar, which is located at the top of the screen, then click on the search bar and type in \"ergonomic keyboard\" using the keyboard, and then click on the \"Search\" button located on the bottom right corner of the keyboard, to begin the search process.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_472": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard.\nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \"My next move would be to move my finger to the search bar, which is located at the top of the screen. I would then click on the search bar and type in \"ergonomic keyboard\" using the keyboard. After typing in the search term, I would click on the \"Search\" button, which is located on the bottom right corner of the keyboard, to initiate the search. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. Please predict your immediate next move. If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_472_0.png",
"answer": "My immediate next move would be to move my finger to the \"Filters\" button, which is located in the top right corner of the screen, next to the \"Windows\" button, then click on the \"Filters\" button to open my filter options and narrow down my search results to only show ergonomic keyboards within my budget range of $50 to $100.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_473": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard.\nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \"My immediate next move would be to move my finger to the \"Filters\" button, which is located at the top right corner of the screen, next to the \"Windows\" button. I would then click on the \"Filters\" button to open the filter options and narrow down my search results to only show ergonomic keyboards within my budget range of $50 to $100. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. Please predict your immediate next move. If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_473_0.png",
"answer": "My immediate next move would be to move my finger to the \"Price & Deals\" filter option, which is located under the \"Colors\" filter option and above the \"Sort by\" filter option then I would click on the \"Price & Deals\" filter option to open the price range filter and set my minimum price to $50 and my maximum price to $100. This further narrowed down my search results to only show ergonomic keyboards within my budget range.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_474": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard. \nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \" My immediate next move would be to move my finger to the \"Price & Deals\" filter option, which is located under the \"Colors\" filter option and above the \"Sort by\" filter option. I would then click on the \"Price & Deals\" filter option to open the price range filter and set my minimum price to $50 and my maximum price to $100. This would further narrow down my search results to only show ergonomic keyboards within my budget range. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. What will you do next? If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_474_0.png",
"answer": "My next move would be to move my finger to the \"Show 1,987 results\" button, located at the bottom of the screen, below the \"Clear Filters\" button and above the navigation bar, and then click on the \"Show 1,987 results\" button to view the results of my ergonomic keyboards within my budget range.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_475": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard. \nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \" My next move would be to move my finger to the \"Show 1,987 results\" button, which is located at the bottom of the screen, below the \"Clear Filters\" button and above the navigation bar. I would then click on the \"Show 1,987 results\" button to view the search results for ergonomic keyboards within my budget range. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. What will you do next? If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_475_0.png",
"answer": "My next move would be to scroll down the screen to view the different options for ergonomic keyboards within my budget range. I would then move my finger to the \"Kensington Pro Fit Ergonomic Wireless Keyboard - Black\" option, which is located below the \"Explore Related Brands\" section and above the \"VIVO\" option. I would then click on the \"Kensington Pro Fit Ergonomic Wireless Keyboard - Black\" option to view more details about the product and potentially make a purchase. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_476": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard. \nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \" My next move would be to scroll down the screen to view the different options for ergonomic keyboards within my budget range. I would then move my finger to the \"Kensington Pro Fit Ergonomic Wireless Keyboard - Black\" option, which is located below the \"Explore Related Brands\" section and above the \"VIVO\" option. I would then click on the \"Kensington Pro Fit Ergonomic Wireless Keyboard - Black\" option to view more details about the product and potentially make a purchase. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. What will you do next? If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_476_0.png",
"answer": "My next move would be to scroll down the screen to view more details about the \"Kensington Pro Fit Ergonomic Wireless Keyboard - Black\" product. I would then move my finger to click other points, which is located below the product image and above the \"Get a $8 bonus when you reload $100 or more to your gift card balance\" section. I would then click on the \"Buy New\" button to proceed with the purchase. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_477": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard. \nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \" My next move would be to scroll down the screen to view more details about the \"Kensington Pro Fit Ergonomic Wireless Keyboard - Black\" product. I would then move my finger to the \"Buy New\" button, which is located below the product image and above the \"Get a $8 bonus when you reload $100 or more to your gift card balance\" section. I would then click on the \"Buy New\" button to proceed with the purchase. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. What will you do next? If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_477_0.png",
"answer": "My next move would be to move my finger to the \"Add to Cart\" button, which is below the \"Buy New\" button and above the \"Ships from Amazon\" section and then click the \"Add to Cart\" button to add the item to my shopping cart.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_478": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard.\nYou are asked to shop for an ergonomic keyboard, your budget is between $50 and $100.\nPrevious action: \" My next move would be to move my finger to the \"Add to Cart\" button, which is located below the \"Buy New\" button and above the \"Ships from Amazon\" section. I would then click on the \"Add to Cart\" button to add the item to my shopping cart. \"\nYou have now completed the previous action as described above. Below is what you see on the phone screen. What will you do next? If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_478_0.png",
"answer": "My next move would be to move my finger to the \"Proceed to Checkout\" button, which is located above the \"Compare with similar items\" section and above the \"30-day returns\" section. I would then click on the \"Proceed to Checkout\" button to proceed with the purchase. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_479": {
"question": "Imagine that you are a robot operating a phone. Like how humans operate the phone, you can move your finger to an icon, click an icon with your finger, scroll down a screen, or type some texts with the keyboard.\nBelow is what you see on the phone screen. Describe the image and predict your next move. If the action involves moving your finger to an icon, describe the location of that icon as detailed as possible.v2_479_0.png",
"answer": "The image on the phone screen is the home screen of an iPhone. There are multiple app icons arranged in a grid-like pattern, including Calendar, Settings, Twitter, Amazon, Instagram, etc. At the top of the screen, there is a notification from a user named \"yykhahah\" that reads \"I see you are in Seattle, let's meet up.\" At the bottom of the screen, there is a search bar.\nBased on the notification, my next move would be to move my finger to the Maps app icon, which is located in the fourth row and the first column of the app grid. This will allow me to search for a location in Seattle and plan a meet up with the user. ",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_480": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nBelow is what you see on the computer screen. Describe the image and predict your next move. If the action involves moving the mouse, describe the location and the icon as detailed as possible.v2_480_0.png",
"answer": "The image on the computer screen is a desktop background of a bridge over a body of water. There are several icons on the desktop, including a YouTube icon, a recycle bin icon, and a terminal icon. There is a taskbar at the bottom of the screen with several application icons, such as Microsoft Edge and File Explorer. There is a notification in the bottom right corner of the screen that says \"Kevin Lin is calling you.\" Based on this notification, my next action is to move my mouse to the bottom right corner of the screen and click on the notification. This opens the calling application and allows me to answer Kevin Lin's call.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_481": {
"question": "Imagine that you are a robot operating a computer. Like how humans operate the computer, you can move the mouse, click an icon with the mouse, or type some texts with the keyboard. \nBelow is what you see on the computer screen. Describe the image and predict your next move. If the action involves moving the mouse, describe the location as detailed as possible.v2_481_0.png",
"answer": "The image on the computer screen is a desktop background of a beautiful bird's eye view of the Seaview Bridge. There are several icons on the left side of the screen including the recycle bin, terminal and a few others. My next move would be to move my mouse to the bottom right corner of the screen and click on Kevin Lin's notification to open the messaging application and reply to his message. I will move my mouse to the exact location of the notification, which is about 2 inches from the right edge of the screen and about 1 inch from the bottom edge of the screen.",
"capability": [
"rec",
"ocr",
"gen",
"spat"
],
"added_in": "v2"
},
"v2_482": {
"question": "Explain the story shown in the images below.v2_482_0.pngv2_482_1.pngv2_482_2.pngv2_482_3.png",
"answer": "The images show a reel on Instagram where a user humorously reveals the extravagant sum they've spent on their dog by employing Biden's quotes of hefty figures for comedic effect. The first image shows a man holding his dog with the caption \"When someone asks me how much I have spent on my dog\". The next three images show a clip of Joe Biden saying \"700 billion,\" \"700 billion and a trillion 300 million\" and \"700 billion and a trillion 300 billion dollars\", respectively.",
"capability": [
"rec",
"ocr",
"know",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_483": {
"question": "Tell me about the video content, given the frames below.v2_483_0.pngv2_483_1.pngv2_483_2.pngv2_483_3.pngv2_483_4.pngv2_483_5.png",
"answer": "The video content is a compilation of things that Asian people do for no reason. The video is posted on Instagram by user laparasian and has 1.3M views and 13.1K likes. The video is set to original audio by sophrelabelous and has the hashtag #asian and #relatable.\nThe video is broken down into 5 different scenes:\n1. The first scene shows a girl grabbing products from the back of the shelf in a supermarket.\n2. The second scene shows a girl rinsing a perfectly clean cup before using it.\n3. The third scene shows two girls asking \"have you eaten yet?\" as a form of greeting.\n4. The fourth scene shows two girls fighting aggressively for the bill in a restaurant.\n5. The fifth scene shows a girl wrapping pants around her neck to see if it fits.\nOverall, the video is a humorous take on some of the quirks and habits that are commonly seen in the Asian community.",
"capability": [
"rec",
"ocr",
"know",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_484": {
"question": "Transcribe the video content, given the frames below.v2_484_0.pngv2_484_1.pngv2_484_2.pngv2_484_3.pngv2_484_4.pngv2_484_5.pngv2_484_6.png",
"answer": "Hi everyone, I'm natyexplora and today I'm sharing 7 places you must visit in Washington State. \nFirst, we have North Cascades National Park. This park is filled with beautiful mountain views and hiking trails. This is a must visit for any nature lover. \nNext, we have the Olympic Peninsula. The area is home to the famous Hoh rainforest and beautiful beaches. This is a great place to relax and enjoy Washington's natural beauty. \nThird on the list is Mount Baker Wilderness. The area is famous for its stunning mountain scenery and hiking trails. It\u2019s a great place to escape the city and enjoy the great outdoors. \nNext, we will head to Mount Rainier National Park. Home to Washington's tallest mountain, the park is a great place for hiking and sightseeing. \nIn fifth place is Alpine Lakes Wilderness. The area is filled with beautiful mountain lakes and hiking trails. This is a great place to spend a day exploring and enjoying Washington\u2019s natural beauty. \nNext, we have Pilchuck Mountain State Park. This park is known for its beautiful scenery and hiking trails. This is a great place to spend a day exploring and enjoying Washington\u2019s natural beauty. \nLast but not least, we have the Gifford Pinchot National Forest. This forest offers beautiful mountain views and hiking trails. It\u2019s a great place to escape the city and enjoy the great outdoors. \nThat wraps up my list of 7 places you need to visit in Washington State. I hope you enjoy it and feel inspired to explore more of this beautiful state.",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_485": {
"question": "Tell me about the video content, given the frames below.v2_485_0.pngv2_485_1.png",
"answer": "The video is about a corgi named Tofu who works from home. The first frame shows Tofu sleeping in a bed and is titled \"WFH Staff: 8:59 AM.\" The second frame shows Tofu sitting in front of a computer with multiple screens, titled \"WFH Staff: 9:00 AM.\" The video may be a humorous take on the work-from-home experience, highlighting that Tofu, like other employees, has a hard time getting out of bed in the morning but is ready to work once in front of the computer.",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_486": {
"question": "Tell me about the video content, given the frames below. Please include as many details as possible.v2_486_0.pngv2_486_1.pngv2_486_2.pngv2_486_3.pngv2_486_4.pngv2_486_5.pngv2_486_6.pngv2_486_7.pngv2_486_8.png",
"answer": "The video features a tutorial on how to make raspberry bliss balls, a healthy breakfast for toddlers and older kids. The video was posted by the Instagram account \"mealtime with mummy\" and currently has over 13k likes. The next frame shows a larger mixing bowl with oats, chia seeds and peanut butter being added to the raspberry puree. The next frame shows a plate with shredded coconut, the raspberry mixture is rolled into small balls and then wrapped in shredded coconut. The last frame shows the finished raspberry bliss balls being placed in a bowl, ready to serve.",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_487": {
"question": "Tell me about the video content, given the frames below. Please include as many details as possible.v2_487_0.pngv2_487_1.pngv2_487_2.pngv2_487_3.pngv2_487_4.pngv2_487_5.pngv2_487_6.jpgv2_487_7.pngv2_487_8.png",
"answer": "The video features a recipe tutorial for Apple and Banana Pancakes. The video was posted on Instagram Reels by user \"mealtime with mummy\" and has 13.2K views. \\ In the first frame, we see a glass bowl with mashed bananas and apples. The second frame shows bananas and apples being mixed together. The third frame shows eggs being added to the mixture. The fourth frame shows a fork being used to stir the mixture. \\ The fifth frame shows a bowl of oats being added to the mixture. The sixth frame is stirring the oats with a spoon. The seventh frame shows spooning the mixture into the skillet. The eighth frame shows the pancake being cooked in the skillet. \\ The last frame shows the fried pancakes on a plate with apple slices, banana and yogurt. The title of the video is \"SAVE for easy breakfast inspo\" and the background music of the video is the song \"Stayin' Alive\" by the band Bee Ge. alive\".",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_488": {
"question": "Tell me about the video content, given the 9 frames below. Please include as many details as possible.v2_488_0.pngv2_488_1.pngv2_488_2.pngv2_488_3.pngv2_488_4.pngv2_488_5.pngv2_488_6.pngv2_488_7.pngv2_488_8.png",
"answer": "The video content is a recipe tutorial for strawberry stuffed French toast. The video is posted on Instagram Reels by the user \"mealtime with mummy\". The video has 13.2K likes and 190 comments.\nIn the first frame, we see a white plate with a dollop of red sauce and a dollop of white cream. The second frame shows the plate with the red sauce and white cream mixed together. The third picture shows a slice of bread with a hexagon torn out of the center by hand.\nThe fourth frame shows a plate with a circular piece of bread on it. The fifth frame shows a hand using a knife to spread a pink mixture onto the bread. The sixth frame shows the bread with the pink mixture covered with another piece of bread, making a sandwich.\nThe seventh frame shows a hand dipping the sandwich into a bowl of beaten eggs. The eighth frame shows the sandwich being fried in a pan. The final frame shows the finished strawberry stuffed French toast on a plate.\nThe video is set to the song \"Stayin' Alive\" by the Bee Gees. The caption reads \"SAVE for easy breakfast inspo \". ",
"capability": [
"rec",
"ocr",
"gen",
"seq"
],
"added_in": "v2"
},
"v2_489": {
"question": "Generate python code to draw similar curves.v2_489_0.png",
"answer": "``` import matplotlib.pyplot as plt\n import numpy as np\n # Sample data points for the x-axis (number of images in millions)\n x = np.array([1, 10, 100, 1000])\n # Sample data points for the y-axis (CIDEr scores)\n y_base = np.array([50, 70, 85, 100])\n y_large = np.array([60, 80, 100, 120])\n y_huge = np.array([70, 90, 110, 140])\n # Plotting the curves\n plt.figure(figsize=(6, 4))\n plt.plot(x, y_base, 'b-*', label='Base')\n plt.plot(x, y_large, 'r-x', label='Large')\n plt.plot(x, y_huge, 'g-o', label='Huge')\n # Setting the x-axis to be logarithmic\n plt.xscale('log')\n # Adding titles and labels\n plt.title('Model performance as a function of pre-training dataset size')\n plt.xlabel('Million images in pre-training')\n plt.ylabel('CIDEr')\n # Adding a legend\n plt.legend()\n # Adding grid\n # Display the plot\n plt.show()```",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_490": {
"question": "Write python code to generate similar figure.v2_490_0.png",
"answer": "``` import matplotlib.pyplot as plt\n # Task names and performance scores\n tasks = ['Caption', 'VQA', 'TR', 'IR', 'NLVR2']\n OSCaR_scores = [122, 72, 95, 90, 78]\n OSCaR_proportion = [100, 94, 100, 100, 100]\n MiniVLM_scores = [120, 70, 90, 85, 72]\n MiniVLM_proportion = [97, 96, 95, 95, 94]\n bar_width = 0.35 # width of the bars\n # Set position of bar on X axis\n r1 = np.arange(len(tasks))\n r2 = [x + bar_width for x in r1]\n # Make the plot\n plt.bar(r1, OSCaR_scores, color='blue', width=bar_width, label='OSCaR')\n plt.bar(r2, MiniVLM_scores, color='red', width=bar_width, label='MiniVLM (ours)')\n # Add text on top of the bars\n for i in range(len(tasks)):\n plt.text(r1[i], OSCaR_scores[i] + 3, f'{OSCaR_proportion[i]}%', ha='center', color='black')\n plt.text(r2[i], MiniVLM_scores[i] + 3, f'{MiniVLM_proportion[i]}%', ha='center', color='black')\n # Add xticks on the middle of the group bars\n plt.xlabel('Tasks', fontweight='bold')\n plt.xticks([r + bar_width / 2 for r in range(len(tasks))], tasks)\n # Create legend & Show graphic\n plt.legend()\n plt.show()```",
"capability": [
"rec",
"gen"
],
"added_in": "v2"
},
"v2_491": {
"question": "Count the number of boats in the image.v2_491_0.png",
"answer": "4",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_492": {
"question": "What is SE and how to compute to get its values in the image?v2_492_0.jpg",
"answer": "The \"SE\" in the image refers to \"Spherical Equivalent,\" which is a way to simplify a prescription for eyesight, combining the sphere (S) and cylinder (C) values of a lens. The spherical equivalent is calculated by taking the sphere value and adding half of the cylinder value.\n\nFor right eye, SE = S + (C/2\uff09= -2.25 + \uff08-1.25/2\uff09= -2.87\nFor left eye, SE = S + (C/2) = -1.25 + (-1.75/2) = -2.12",
"capability": [
"rec",
"ocr",
"gen"
],
"added_in": "v2"
},
"v2_493": {
"question": "I am playing as the red pieces, and it's my turn. Which piece should I move to achieve checkmate in one move?v2_493_0.jpg",
"answer": "\u70aeCannon",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_494": {
"question": "I am playing as the black pieces, and it's my turn. What move should I execute to achieve checkmate in one move?v2_494_0.png",
"answer": "Qh3#Qh3Queen moves to h3",
"capability": [
"rec",
"know",
"gen"
],
"added_in": "v2"
},
"v2_495": {
"question": "How many feet do these animals have in total?v2_495_0.jpg",
"answer": "16",
"capability": [
"rec",
"know"
],
"added_in": "v2"
},
"v2_496": {
"question": "Where might I be able to take this photo?v2_496_0.jpg",
"answer": "Window of the WorldShenzhen",
"capability": [
"rec",
"know"
],
"added_in": "v2"
},
"v2_497": {
"question": "Which drink has fewer total calories, the first or the second?v2_497_0.jpgv2_497_1.jpg",
"answer": "second",
"capability": [
"rec",
"ocr",
"seq"
],
"added_in": "v2"
},
"v2_498": {
"question": "Which line is longer, the top or the bottom?v2_498_0.jpg",
"answer": "bottom",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_499": {
"question": "Which ball is bigger, A or B?v2_499_0.jpg",
"answer": "A",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_500": {
"question": "How many feet do these animals have in total?v2_500_0.jpg",
"answer": "10",
"capability": [
"rec",
"know"
],
"added_in": "v2"
},
"v2_501": {
"question": "how many ducks are there in the image?v2_501_0.jpg",
"answer": "6",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_502": {
"question": "Is Yao Ming the tallest?v2_502_0.jpg",
"answer": "no",
"capability": [
"rec",
"know"
],
"added_in": "v2"
},
"v2_503": {
"question": "How many fingers does the right hand of the girl have?v2_503_0.jpg",
"answer": "",
"capability": [
"rec"
],
"added_in": "v2"
},
"v2_504": {
"question": "Is it possible for the car to move with magnetic force according to the Physical laws?v2_504_0.jpg",
"answer": "yes",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_505": {
"question": "Which track should the trolley go on, A or B?v2_505_0.jpg",
"answer": "A",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_506": {
"question": "Can we make sure the cat is alive before we open the box?v2_506_0.jpg",
"answer": "yes",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_507": {
"question": "Can we make sure the cat is alive before we open the box?v2_507_0.jpg",
"answer": "yes",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_508": {
"question": "From location A to location B, is it faster to go east or west?v2_508_0.jpg",
"answer": "east",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_509": {
"question": "Which circle is larger, A or B?v2_509_0.jpg",
"answer": "A",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_510": {
"question": "Are the red lines curved?v2_510_0.jpg",
"answer": "yes",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
},
"v2_511": {
"question": "As shown in the image, two iron balls are hanging on the Leaning Tower of Pisa, ball A weighs 20kg, and ball B weighs 5kg. If the ropes hanging them are cut at the same time and air resistance is ignored, which iron ball will land first?v2_511_0.jpg",
"answer": "A",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_512": {
"question": "Neglecting air buoyancy (vacuum), which side will go down, iron or cotton?v2_512_0.jpg",
"answer": "iron",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_513": {
"question": "Is it rabbit or duck?v2_513_0.jpg",
"answer": "duck",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_514": {
"question": "How many dwarfs are there near Snow White in the image?v2_514_0.jpg",
"answer": "6",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_515": {
"question": "Which bottle contains more water, the left or the right?v2_515_0.jpg",
"answer": "left",
"capability": [
"rec",
"spat",
"know"
],
"added_in": "v2"
},
"v2_516": {
"question": "How many feet does this elephant have in the image, 4 or 5?v2_516_0.jpg",
"answer": "4",
"capability": [
"rec",
"spat"
],
"added_in": "v2"
}
}