diff --git "a/ /HRBench4K_local.tsv" "b/ /HRBench4K_local.tsv" new file mode 100644--- /dev/null +++ "b/ /HRBench4K_local.tsv" @@ -0,0 +1,801 @@ +"index" "answer" "question" "A" "B" "C" "D" "category" "cycle_category" "image_path" +"0" "A" "What is the number displayed above the entrance where the woman is standing?" "27B" "37B" "27D" "27E" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/0.jpg" +"1" "B" "What is the number displayed above the entrance where the woman is standing?" "27E" "27B" "37B" "27D" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/1.jpg" +"2" "C" "What is the number displayed above the entrance where the woman is standing?" "27E" "27D" "27B" "37B" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/2.jpg" +"3" "D" "What is the number displayed above the entrance where the woman is standing?" "27E" "37B" "27D" "27B" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/3.jpg" +"4" "A" "What is the color of the mailbox?" "Blue" "Red" "Green" "Black" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/4.jpg" +"5" "B" "What is the color of the mailbox?" "Green" "Blue" "Black" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/5.jpg" +"6" "C" "What is the color of the mailbox?" "Green" "Black" "Blue" "Red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/6.jpg" +"7" "D" "What is the color of the mailbox?" "Green" "Black" "Red" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/7.jpg" +"8" "A" "Is the mailbox on the left or right side of the woman?" "Right" "Directly above" "In front" "Left" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/8.jpg" +"9" "B" "Is the mailbox on the left or right side of the woman?" "Left" "Right" "In front" "Directly above" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/9.jpg" +"10" "C" "Is the mailbox on the left or right side of the woman?" "Directly above" "In front" "Right" "Left" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/10.jpg" +"11" "D" "Is the mailbox on the left or right side of the woman?" "Directly above" "In front" "Left" "Right" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/11.jpg" +"12" "A" "What is written on the white board in front of the girl in purple shorts?" "ELEVATE" "ELEVATE." "ELVTE" "CeVaY" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/12.jpg" +"13" "B" "What is written on the white board in front of the girl in purple shorts?" "ELVTE" "ELEVATE" "CeVaY" "ELEVATE." "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/13.jpg" +"14" "C" "What is written on the white board in front of the girl in purple shorts?" "ELEVATE." "ELVTE" "ELEVATE" "CeVaY" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/14.jpg" +"15" "D" "What is written on the white board in front of the girl in purple shorts?" "ELVTE" "CeVaY" "ELEVATE." "ELEVATE" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/15.jpg" +"16" "A" "What is the text written on the blue golf ball holder?" "NEW MEXICO MUTUAL" "NEW YORK MUTUAL" "MUTUAL INSURANCE" "NEW MEXICO INSURANCE" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/16.jpg" +"17" "B" "What is the text written on the blue golf ball holder?" "MUTUAL INSURANCE" "NEW MEXICO MUTUAL" "NEW YORK MUTUAL" "NEW MEXICO INSURANCE" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/17.jpg" +"18" "C" "What is the text written on the blue golf ball holder?" "MUTUAL INSURANCE" "NEW MEXICO INSURANCE" "NEW MEXICO MUTUAL" "NEW YORK MUTUAL" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/18.jpg" +"19" "D" "What is the text written on the blue golf ball holder?" "NEW MEXICO INSURANCE" "NEW YORK MUTUAL" "MUTUAL INSURANCE" "NEW MEXICO MUTUAL" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/19.jpg" +"20" "A" "What is the color of the golf ball holder?" "Blue" "Red" "Black" "White" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/20.jpg" +"21" "B" "What is the color of the golf ball holder?" "Red" "Blue" "Black" "White" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/21.jpg" +"22" "C" "What is the color of the golf ball holder?" "Black" "Red" "Blue" "White" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/22.jpg" +"23" "D" "What is the color of the golf ball holder?" "White" "Black" "Red" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/23.jpg" +"24" "A" "What is the license plate number of the car?" "RK 879" "RK 789" "PK 879" "RK 876" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/24.jpg" +"25" "B" "What is the license plate number of the car?" "RK 789" "RK 879" "PK 879" "RK 876" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/25.jpg" +"26" "C" "What is the license plate number of the car?" "RK 876" "RK 789" "RK 879" "PK 879" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/26.jpg" +"27" "D" "What is the license plate number of the car?" "RK 876" "PK 879" "RK 789" "RK 879" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/27.jpg" +"28" "A" "Which side of the car is the person sitting on?" "Front (hood)" "Driver's side" "Passenger's side" "Back (trunk)" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/28.jpg" +"29" "B" "Which side of the car is the person sitting on?" "Back (trunk)" "Front (hood)" "Driver's side" "Passenger's side" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/29.jpg" +"30" "C" "Which side of the car is the person sitting on?" "Back (trunk)" "Driver's side" "Front (hood)" "Passenger's side" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/30.jpg" +"31" "D" "Which side of the car is the person sitting on?" "Back (trunk)" "Driver's side" "Passenger's side" "Front (hood)" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/31.jpg" +"32" "A" "Where is the water bottle placed relative to the person in the image?" "On the right side" "On the left side" "Behind the person" "In front of the person" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/32.jpg" +"33" "B" "Where is the water bottle placed relative to the person in the image?" "In front of the person" "On the right side" "Behind the person" "On the left side" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/33.jpg" +"34" "C" "Where is the water bottle placed relative to the person in the image?" "On the left side" "In front of the person" "On the right side" "Behind the person" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/34.jpg" +"35" "D" "Where is the water bottle placed relative to the person in the image?" "Behind the person" "On the left side" "In front of the person" "On the right side" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/35.jpg" +"36" "A" "Which brand is mentioned on the black rectangular device located at the left of the image?" "Insignia" "Samsung" "Apple" "Sony" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/36.jpg" +"37" "B" "Which brand is mentioned on the black rectangular device located at the left of the image?" "Apple" "Insignia" "Sony" "Samsung" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/37.jpg" +"38" "C" "Which brand is mentioned on the black rectangular device located at the left of the image?" "Samsung" "Apple" "Insignia" "Sony" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/38.jpg" +"39" "D" "Which brand is mentioned on the black rectangular device located at the left of the image?" "Apple" "Samsung" "Sony" "Insignia" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/39.jpg" +"40" "A" "What is the text written above the logo on the jacket's sleeve?" "epio MIX" "epog MIX" "epoc MIX" "epig MIX" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/40.jpg" +"41" "B" "What is the text written above the logo on the jacket's sleeve?" "epig MIX" "epio MIX" "epoc MIX" "epog MIX" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/41.jpg" +"42" "C" "What is the text written above the logo on the jacket's sleeve?" "epog MIX" "epoc MIX" "epio MIX" "epig MIX" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/42.jpg" +"43" "D" "What is the text written above the logo on the jacket's sleeve?" "epog MIX" "epoc MIX" "epig MIX" "epio MIX" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/43.jpg" +"44" "A" "What type of gloves is the person in the background wearing?" "White gloves" "Red gloves" "Black gloves" "Blue gloves" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/44.jpg" +"45" "B" "What type of gloves is the person in the background wearing?" "Red gloves" "White gloves" "Blue gloves" "Black gloves" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/45.jpg" +"46" "C" "What type of gloves is the person in the background wearing?" "Black gloves" "Red gloves" "White gloves" "Blue gloves" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/46.jpg" +"47" "D" "What type of gloves is the person in the background wearing?" "Blue gloves" "Black gloves" "Red gloves" "White gloves" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/47.jpg" +"48" "A" "Where is the person standing in relation to the recycle bin?" "In front of the recycle bin" "Behind the recycle bin" "To the right of the recycle bin" "To the left of the recycle bin" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/48.jpg" +"49" "B" "Where is the person standing in relation to the recycle bin?" "To the right of the recycle bin" "In front of the recycle bin" "Behind the recycle bin" "To the left of the recycle bin" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/49.jpg" +"50" "C" "Where is the person standing in relation to the recycle bin?" "To the right of the recycle bin" "To the left of the recycle bin" "In front of the recycle bin" "Behind the recycle bin" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/50.jpg" +"51" "D" "Where is the person standing in relation to the recycle bin?" "Behind the recycle bin" "To the left of the recycle bin" "To the right of the recycle bin" "In front of the recycle bin" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/51.jpg" +"52" "A" "What is the number written on the sign visible in the background of the image?" "08-26" "08-28" "09-27" "07-25" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/52.jpg" +"53" "B" "What is the number written on the sign visible in the background of the image?" "07-25" "08-26" "08-28" "09-27" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/53.jpg" +"54" "C" "What is the number written on the sign visible in the background of the image?" "08-28" "09-27" "08-26" "07-25" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/54.jpg" +"55" "D" "What is the number written on the sign visible in the background of the image?" "08-28" "07-25" "09-27" "08-26" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/55.jpg" +"56" "A" "What is the color of the sign in the image?" "Yellow and white" "White and red" "Yellow and green" "Green and white" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/56.jpg" +"57" "B" "What is the color of the sign in the image?" "Green and white" "Yellow and white" "Yellow and green" "White and red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/57.jpg" +"58" "C" "What is the color of the sign in the image?" "White and red" "Green and white" "Yellow and white" "Yellow and green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/58.jpg" +"59" "D" "What is the color of the sign in the image?" "White and red" "Green and white" "Yellow and green" "Yellow and white" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/59.jpg" +"60" "A" "What is the color of the umbrella?" "Blue" "Black" "Green" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/60.jpg" +"61" "B" "What is the color of the umbrella?" "Black" "Blue" "Red" "Green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/61.jpg" +"62" "C" "What is the color of the umbrella?" "Green" "Red" "Blue" "Black" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/62.jpg" +"63" "D" "What is the color of the umbrella?" "Black" "Red" "Green" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/63.jpg" +"64" "A" "What is the title of the framed poster visible in the image?" "Ely Diocese" "Ely Division" "Ely Diocess" "Ely Cathedral" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/64.jpg" +"65" "B" "What is the title of the framed poster visible in the image?" "Ely Diocess" "Ely Diocese" "Ely Cathedral" "Ely Division" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/65.jpg" +"66" "C" "What is the title of the framed poster visible in the image?" "Ely Diocess" "Ely Division" "Ely Diocese" "Ely Cathedral" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/66.jpg" +"67" "D" "What is the title of the framed poster visible in the image?" "Ely Diocess" "Ely Division" "Ely Cathedral" "Ely Diocese" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/67.jpg" +"68" "A" "What is the name of the barge on the left side of the image?" "PETER LIND" "PETER LUND" "PETER LING" "PETER LEND" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/68.jpg" +"69" "B" "What is the name of the barge on the left side of the image?" "PETER LING" "PETER LIND" "PETER LEND" "PETER LUND" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/69.jpg" +"70" "C" "What is the name of the barge on the left side of the image?" "PETER LUND" "PETER LEND" "PETER LIND" "PETER LING" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/70.jpg" +"71" "D" "What is the name of the barge on the left side of the image?" "PETER LUND" "PETER LEND" "PETER LING" "PETER LIND" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/71.jpg" +"72" "A" "What color is the neon ""OPEN"" sign hanging above the items for sale?" "Red and blue" "Blue and green" "Yellow and green" "White and blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/72.jpg" +"73" "B" "What color is the neon ""OPEN"" sign hanging above the items for sale?" "White and blue" "Red and blue" "Blue and green" "Yellow and green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/73.jpg" +"74" "C" "What color is the neon ""OPEN"" sign hanging above the items for sale?" "White and blue" "Yellow and green" "Red and blue" "Blue and green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/74.jpg" +"75" "D" "What color is the neon ""OPEN"" sign hanging above the items for sale?" "Blue and green" "Yellow and green" "White and blue" "Red and blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/75.jpg" +"76" "A" "What is written on the road sign directly below the American flag?" "ONE WAY" "NO ENTRY" "ONE KIT" "ONE KEY" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/76.jpg" +"77" "B" "What is written on the road sign directly below the American flag?" "NO ENTRY" "ONE WAY" "ONE KIT" "ONE KEY" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/77.jpg" +"78" "C" "What is written on the road sign directly below the American flag?" "ONE KIT" "ONE KEY" "ONE WAY" "NO ENTRY" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/78.jpg" +"79" "D" "What is written on the road sign directly below the American flag?" "ONE KIT" "NO ENTRY" "ONE KEY" "ONE WAY" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/79.jpg" +"80" "A" "What is the name or number written on the front of the train?" "460 112-6" "460 024-2" "460 042-4" "460 040-4" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/80.jpg" +"81" "B" "What is the name or number written on the front of the train?" "460 040-4" "460 112-6" "460 042-4" "460 024-2" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/81.jpg" +"82" "C" "What is the name or number written on the front of the train?" "460 040-4" "460 042-4" "460 112-6" "460 024-2" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/82.jpg" +"83" "D" "What is the name or number written on the front of the train?" "460 040-4" "460 042-4" "460 024-2" "460 112-6" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/83.jpg" +"84" "A" "How many dogs are being walked in the image?" "Four" "Five" "Two" "Three" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/84.jpg" +"85" "B" "How many dogs are being walked in the image?" "Five" "Four" "Two" "Three" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/85.jpg" +"86" "C" "How many dogs are being walked in the image?" "Five" "Three" "Four" "Two" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/86.jpg" +"87" "D" "How many dogs are being walked in the image?" "Three" "Five" "Two" "Four" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/87.jpg" +"88" "A" "What's color of the bike in the image?" "Yellow" "Black" "Red" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/88.jpg" +"89" "B" "What's color of the bike in the image?" "Black" "Yellow" "Blue" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/89.jpg" +"90" "C" "What's color of the bike in the image?" "Black" "Blue" "Yellow" "Red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/90.jpg" +"91" "D" "What's color of the bike in the image?" "Blue" "Red" "Black" "Yellow" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/91.jpg" +"92" "A" "Tell me the shape of the signboard attached to the building?" "Rectangular" "Oval" "Triangular" "Circular" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/92.jpg" +"93" "B" "Tell me the shape of the signboard attached to the building?" "Triangular" "Rectangular" "Oval" "Circular" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/93.jpg" +"94" "C" "Tell me the shape of the signboard attached to the building?" "Oval" "Triangular" "Rectangular" "Circular" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/94.jpg" +"95" "D" "Tell me the shape of the signboard attached to the building?" "Triangular" "Circular" "Oval" "Rectangular" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/95.jpg" +"96" "A" "What's the text written on the signboard in the image?" "frankfurter botschaft" "frankfurt botshaft" "frankfurt botschaft" "frankfurter botshaft" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/96.jpg" +"97" "B" "What's the text written on the signboard in the image?" "frankfurt botschaft" "frankfurter botschaft" "frankfurt botshaft" "frankfurter botshaft" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/97.jpg" +"98" "C" "What's the text written on the signboard in the image?" "frankfurt botshaft" "frankfurter botshaft" "frankfurter botschaft" "frankfurt botschaft" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/98.jpg" +"99" "D" "What's the text written on the signboard in the image?" "frankfurt botschaft" "frankfurt botshaft" "frankfurter botshaft" "frankfurter botschaft" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/99.jpg" +"100" "A" "What's the relative position of the orange building compared to the cylindrical green building?" "To the left" "Behind" "Directly in front" "To the right" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/100.jpg" +"101" "B" "What's the relative position of the orange building compared to the cylindrical green building?" "Directly in front" "To the left" "To the right" "Behind" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/101.jpg" +"102" "C" "What's the relative position of the orange building compared to the cylindrical green building?" "Behind" "To the right" "To the left" "Directly in front" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/102.jpg" +"103" "D" "What's the relative position of the orange building compared to the cylindrical green building?" "To the right" "Behind" "Directly in front" "To the left" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/103.jpg" +"104" "A" "What is the name of the place mentioned on the signboard above the left door?" "ABRI PATAUD" "ABRI PATEAU" "ABRI PATARD" "ABRI PRATARD" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/104.jpg" +"105" "B" "What is the name of the place mentioned on the signboard above the left door?" "ABRI PATARD" "ABRI PATAUD" "ABRI PRATARD" "ABRI PATEAU" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/105.jpg" +"106" "C" "What is the name of the place mentioned on the signboard above the left door?" "ABRI PATARD" "ABRI PRATARD" "ABRI PATAUD" "ABRI PATEAU" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/106.jpg" +"107" "D" "What is the name of the place mentioned on the signboard above the left door?" "ABRI PATEAU" "ABRI PATARD" "ABRI PRATARD" "ABRI PATAUD" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/107.jpg" +"108" "A" "What color is the backpack carried by the man wearing a yellow shirt?" "Blue" "Green" "Black" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/108.jpg" +"109" "B" "What color is the backpack carried by the man wearing a yellow shirt?" "Red" "Blue" "Black" "Green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/109.jpg" +"110" "C" "What color is the backpack carried by the man wearing a yellow shirt?" "Black" "Red" "Blue" "Green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/110.jpg" +"111" "D" "What color is the backpack carried by the man wearing a yellow shirt?" "Black" "Red" "Green" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/111.jpg" +"112" "A" "On which side of the man wearing a yellow shirt is the girl wearing a blue top sitting?" "Left" "Directly in front" "Right" "Behind" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/112.jpg" +"113" "B" "On which side of the man wearing a yellow shirt is the girl wearing a blue top sitting?" "Directly in front" "Left" "Right" "Behind" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/113.jpg" +"114" "C" "On which side of the man wearing a yellow shirt is the girl wearing a blue top sitting?" "Right" "Behind" "Left" "Directly in front" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/114.jpg" +"115" "D" "On which side of the man wearing a yellow shirt is the girl wearing a blue top sitting?" "Behind" "Directly in front" "Right" "Left" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/115.jpg" +"116" "A" "What is the time shown on the clock?" "Approximately 11:00" "Approximately 12:15" "Approximately 12:00" "Approximately 11:10" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/116.jpg" +"117" "B" "What is the time shown on the clock?" "Approximately 11:10" "Approximately 11:00" "Approximately 12:00" "Approximately 12:15" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/117.jpg" +"118" "C" "What is the time shown on the clock?" "Approximately 12:00" "Approximately 12:15" "Approximately 11:00" "Approximately 11:10" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/118.jpg" +"119" "D" "What is the time shown on the clock?" "Approximately 12:00" "Approximately 11:10" "Approximately 12:15" "Approximately 11:00" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/119.jpg" +"120" "A" "Which direction is the river flowing relative to the clock tower?" "To the right" "Towards the clock tower" "To the left" "Away from the clock tower" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/120.jpg" +"121" "B" "Which direction is the river flowing relative to the clock tower?" "Towards the clock tower" "To the right" "Away from the clock tower" "To the left" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/121.jpg" +"122" "C" "Which direction is the river flowing relative to the clock tower?" "Away from the clock tower" "To the left" "To the right" "Towards the clock tower" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/122.jpg" +"123" "D" "Which direction is the river flowing relative to the clock tower?" "To the left" "Away from the clock tower" "Towards the clock tower" "To the right" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/123.jpg" +"124" "A" "What's located in the middle of the water?" "A small island with a tree" "A small island with a statue" "A small island with a bench" "A small island with a gazebo" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/124.jpg" +"125" "B" "What's located in the middle of the water?" "A small island with a statue" "A small island with a tree" "A small island with a gazebo" "A small island with a bench" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/125.jpg" +"126" "C" "What's located in the middle of the water?" "A small island with a bench" "A small island with a gazebo" "A small island with a tree" "A small island with a statue" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/126.jpg" +"127" "D" "What's located in the middle of the water?" "A small island with a bench" "A small island with a statue" "A small island with a gazebo" "A small island with a tree" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/127.jpg" +"128" "A" "What is the speed limit indicated by the sign in the image?" "20 km/h" "15 km/h" "30 km/h" "25 km/h" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/128.jpg" +"129" "B" "What is the speed limit indicated by the sign in the image?" "30 km/h" "20 km/h" "15 km/h" "25 km/h" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/129.jpg" +"130" "C" "What is the speed limit indicated by the sign in the image?" "15 km/h" "30 km/h" "20 km/h" "25 km/h" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/130.jpg" +"131" "D" "What is the speed limit indicated by the sign in the image?" "25 km/h" "30 km/h" "15 km/h" "20 km/h" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/131.jpg" +"132" "A" "What is the year inscribed on the sundial?" "1762" "1768" "1752" "1782" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/132.jpg" +"133" "B" "What is the year inscribed on the sundial?" "1752" "1762" "1782" "1768" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/133.jpg" +"134" "C" "What is the year inscribed on the sundial?" "1782" "1768" "1762" "1752" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/134.jpg" +"135" "D" "What is the year inscribed on the sundial?" "1782" "1768" "1752" "1762" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/135.jpg" +"136" "A" "What is the message written on the sign?" "KHU VUC NGUY HIEM KHONG NHAY" "KHU VUC NGUY HIEM KHONG NHAT" "KHU VUC AN TOAN KHONG NHAY" "KHU VUC NGUY HIEM KHONA NHAT" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/136.jpg" +"137" "B" "What is the message written on the sign?" "KHU VUC NGUY HIEM KHONG NHAT" "KHU VUC NGUY HIEM KHONG NHAY" "KHU VUC AN TOAN KHONG NHAY" "KHU VUC NGUY HIEM KHONA NHAT" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/137.jpg" +"138" "C" "What is the message written on the sign?" "KHU VUC AN TOAN KHONG NHAY" "KHU VUC NGUY HIEM KHONG NHAT" "KHU VUC NGUY HIEM KHONG NHAY" "KHU VUC NGUY HIEM KHONA NHAT" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/138.jpg" +"139" "D" "What is the message written on the sign?" "KHU VUC AN TOAN KHONG NHAY" "KHU VUC NGUY HIEM KHONA NHAT" "KHU VUC NGUY HIEM KHONG NHAT" "KHU VUC NGUY HIEM KHONG NHAY" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/139.jpg" +"140" "A" "What are the hazard numbers displayed on the left side storage container's label?" "1,3" "1" "1,2" "2,3" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/140.jpg" +"141" "B" "What are the hazard numbers displayed on the left side storage container's label?" "1" "1,3" "2,3" "1,2" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/141.jpg" +"142" "C" "What are the hazard numbers displayed on the left side storage container's label?" "2,3" "1,2" "1,3" "1" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/142.jpg" +"143" "D" "What are the hazard numbers displayed on the left side storage container's label?" "1" "1,2" "2,3" "1,3" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/143.jpg" +"144" "A" "What is the color of the ""1"" on the left side hazard label of the storage container?" "Yellow" "Red" "Green" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/144.jpg" +"145" "B" "What is the color of the ""1"" on the left side hazard label of the storage container?" "Blue" "Yellow" "Green" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/145.jpg" +"146" "C" "What is the color of the ""1"" on the left side hazard label of the storage container?" "Blue" "Green" "Yellow" "Red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/146.jpg" +"147" "D" "What is the color of the ""1"" on the left side hazard label of the storage container?" "Green" "Blue" "Red" "Yellow" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/147.jpg" +"148" "A" "What's the color of the Surveillance camera?" "Off-White" "Blue" "there is no Surveillance camera" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/148.jpg" +"149" "B" "What's the color of the Surveillance camera?" "there is no Surveillance camera" "Off-White" "Red" "Blue" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/149.jpg" +"150" "C" "What's the color of the Surveillance camera?" "Blue" "Red" "Off-White" "there is no Surveillance camera" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/150.jpg" +"151" "D" "What's the color of the Surveillance camera?" "there is no Surveillance camera" "Red" "Blue" "Off-White" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/151.jpg" +"152" "A" "What's the text written on the sign attached to the wall of building?" "Rue Saint-Paul" "Rue Saint-Jean" "Rue Sainte-Marie" "Rue Saint-Pierre" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/152.jpg" +"153" "B" "What's the text written on the sign attached to the wall of building?" "Rue Saint-Pierre" "Rue Saint-Paul" "Rue Sainte-Marie" "Rue Saint-Jean" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/153.jpg" +"154" "C" "What's the text written on the sign attached to the wall of building?" "Rue Saint-Pierre" "Rue Sainte-Marie" "Rue Saint-Paul" "Rue Saint-Jean" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/154.jpg" +"155" "D" "What's the text written on the sign attached to the wall of building?" "Rue Saint-Jean" "Rue Saint-Pierre" "Rue Sainte-Marie" "Rue Saint-Paul" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/155.jpg" +"156" "A" "What's the color of the car?" "Red" "Green" "Yellow" "Black" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/156.jpg" +"157" "B" "What's the color of the car?" "Yellow" "Red" "Green" "Black" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/157.jpg" +"158" "C" "What's the color of the car?" "Green" "Black" "Red" "Yellow" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/158.jpg" +"159" "D" "What's the color of the car?" "Green" "Black" "Yellow" "Red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/159.jpg" +"160" "A" "What color is the girl's shirt?" "Pink" "Yellow" "White" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/160.jpg" +"161" "B" "What color is the girl's shirt?" "White" "Pink" "Yellow" "Blue" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/161.jpg" +"162" "C" "What color is the girl's shirt?" "White" "Yellow" "Pink" "Blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/162.jpg" +"163" "D" "What color is the girl's shirt?" "White" "Yellow" "Blue" "Pink" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/163.jpg" +"164" "A" "What's color of the car?" "White" "Pink" "Blue" "Yellow" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/164.jpg" +"165" "B" "What's color of the car?" "Pink" "White" "Yellow" "Blue" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/165.jpg" +"166" "C" "What's color of the car?" "Yellow" "Pink" "White" "Blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/166.jpg" +"167" "D" "What's color of the car?" "Blue" "Yellow" "Pink" "White" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/167.jpg" +"168" "A" "What's the primary color of the person's clothing in the image?" "Blue" "White" "Green" "Yellow" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/168.jpg" +"169" "B" "What's the primary color of the person's clothing in the image?" "Green" "Blue" "White" "Yellow" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/169.jpg" +"170" "C" "What's the primary color of the person's clothing in the image?" "Green" "Yellow" "Blue" "White" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/170.jpg" +"171" "D" "What's the primary color of the person's clothing in the image?" "Green" "White" "Yellow" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/171.jpg" +"172" "A" "What's the color of the flag in the image?" "Blue, white and red" "Black and white" "Black, white and red" "Black and red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/172.jpg" +"173" "B" "What's the color of the flag in the image?" "Black and white" "Blue, white and red" "Black, white and red" "Black and red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/173.jpg" +"174" "C" "What's the color of the flag in the image?" "Black and red" "Black and white" "Blue, white and red" "Black, white and red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/174.jpg" +"175" "D" "What's the color of the flag in the image?" "Black and white" "Black and red" "Black, white and red" "Blue, white and red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/175.jpg" +"176" "A" "What street is indicated by the sign on the pole near the center bottom of the image?" "MICHIGAN" "MACHLGUN" "MICHIGUN" "MACHIGAN" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/176.jpg" +"177" "B" "What street is indicated by the sign on the pole near the center bottom of the image?" "MACHIGAN" "MICHIGAN" "MACHLGUN" "MICHIGUN" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/177.jpg" +"178" "C" "What street is indicated by the sign on the pole near the center bottom of the image?" "MACHLGUN" "MICHIGUN" "MICHIGAN" "MACHIGAN" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/178.jpg" +"179" "D" "What street is indicated by the sign on the pole near the center bottom of the image?" "MACHIGAN" "MACHLGUN" "MICHIGUN" "MICHIGAN" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/179.jpg" +"180" "A" "What's the number written on the boat?" "15" "5" "10" "25" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/180.jpg" +"181" "B" "What's the number written on the boat?" "10" "15" "5" "25" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/181.jpg" +"182" "C" "What's the number written on the boat?" "25" "10" "15" "5" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/182.jpg" +"183" "D" "What's the number written on the boat?" "10" "5" "25" "15" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/183.jpg" +"184" "A" "What color is the shirt worn by the person in the image?" "Blue" "Red" "Green" "Yellow" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/184.jpg" +"185" "B" "What color is the shirt worn by the person in the image?" "Yellow" "Blue" "Green" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/185.jpg" +"186" "C" "What color is the shirt worn by the person in the image?" "Red" "Yellow" "Blue" "Green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/186.jpg" +"187" "D" "What color is the shirt worn by the person in the image?" "Yellow" "Green" "Red" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/187.jpg" +"188" "A" "What's color of the flag?" "White" "Yellow" "Red" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/188.jpg" +"189" "B" "What's color of the flag?" "Red" "White" "Blue" "Yellow" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/189.jpg" +"190" "C" "What's color of the flag?" "Blue" "Yellow" "White" "Red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/190.jpg" +"191" "D" "What's color of the flag?" "Blue" "Red" "Yellow" "White" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/191.jpg" +"192" "A" "What's the color of the uniform of the figurine on the shelf?" "White" "Green" "Blue" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/192.jpg" +"193" "B" "What's the color of the uniform of the figurine on the shelf?" "Blue" "White" "Green" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/193.jpg" +"194" "C" "What's the color of the uniform of the figurine on the shelf?" "Blue" "Red" "White" "Green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/194.jpg" +"195" "D" "What's the color of the uniform of the figurine on the shelf?" "Green" "Red" "Blue" "White" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/195.jpg" +"196" "A" "What's the color of the visible vehicle in the image?" "White" "Red" "Black" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/196.jpg" +"197" "B" "What's the color of the visible vehicle in the image?" "Blue" "White" "Black" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/197.jpg" +"198" "C" "What's the color of the visible vehicle in the image?" "Blue" "Black" "White" "Red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/198.jpg" +"199" "D" "What's the color of the visible vehicle in the image?" "Black" "Red" "Blue" "White" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/199.jpg" +"200" "A" "What's the color of the climber's hat?" "Red" "Blue" "Black" "White" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/200.jpg" +"201" "B" "What's the color of the climber's hat?" "Blue" "Red" "White" "Black" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/201.jpg" +"202" "C" "What's the color of the climber's hat?" "Black" "Blue" "Red" "White" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/202.jpg" +"203" "D" "What's the color of the climber's hat?" "White" "Blue" "Black" "Red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/203.jpg" +"204" "A" "What's the color of the trailer?" "Orange" "Black" "White" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/204.jpg" +"205" "B" "What's the color of the trailer?" "Black" "Orange" "White" "Blue" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/205.jpg" +"206" "C" "What's the color of the trailer?" "White" "Blue" "Orange" "Black" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/206.jpg" +"207" "D" "What's the color of the trailer?" "Black" "Blue" "White" "Orange" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/207.jpg" +"208" "A" "What's the phone number written on the boat?" "0905 87 38 38" "0905 87 36 38" "0905 87 39 38" "0905 87 38 28" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/208.jpg" +"209" "B" "What's the phone number written on the boat?" "0905 87 38 28" "0905 87 38 38" "0905 87 39 38" "0905 87 36 38" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/209.jpg" +"210" "C" "What's the phone number written on the boat?" "0905 87 38 28" "0905 87 39 38" "0905 87 38 38" "0905 87 36 38" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/210.jpg" +"211" "D" "What's the phone number written on the boat?" "0905 87 36 38" "0905 87 39 38" "0905 87 38 28" "0905 87 38 38" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/211.jpg" +"212" "A" "What's the color of the motorcycle?" "Red" "Green" "Yellow" "White" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/212.jpg" +"213" "B" "What's the color of the motorcycle?" "Yellow" "Red" "White" "Green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/213.jpg" +"214" "C" "What's the color of the motorcycle?" "Yellow" "White" "Red" "Green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/214.jpg" +"215" "D" "What's the color of the motorcycle?" "Yellow" "White" "Green" "Red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/215.jpg" +"216" "A" "What is the title of the book displayed prominently on the stand?" "Holy Bible" "Book of Common Prayer" "Winchester Psalter" "Hymnal" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/216.jpg" +"217" "B" "What is the title of the book displayed prominently on the stand?" "Book of Common Prayer" "Holy Bible" "Winchester Psalter" "Hymnal" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/217.jpg" +"218" "C" "What is the title of the book displayed prominently on the stand?" "Book of Common Prayer" "Winchester Psalter" "Holy Bible" "Hymnal" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/218.jpg" +"219" "D" "What is the title of the book displayed prominently on the stand?" "Book of Common Prayer" "Winchester Psalter" "Hymnal" "Holy Bible" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/219.jpg" +"220" "A" "What color are the flowers?" "Purple" "Red" "Yellow" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/220.jpg" +"221" "B" "What color are the flowers?" "Blue" "Purple" "Yellow" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/221.jpg" +"222" "C" "What color are the flowers?" "Yellow" "Red" "Purple" "Blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/222.jpg" +"223" "D" "What color are the flowers?" "Red" "Yellow" "Blue" "Purple" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/223.jpg" +"224" "A" "What is the phone number listed on the building in the foreground?" "206 441 5000" "206 451 5000" "206 444 5000" "206 441 4000" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/224.jpg" +"225" "B" "What is the phone number listed on the building in the foreground?" "206 441 4000" "206 441 5000" "206 444 5000" "206 451 5000" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/225.jpg" +"226" "C" "What is the phone number listed on the building in the foreground?" "206 444 5000" "206 441 4000" "206 441 5000" "206 451 5000" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/226.jpg" +"227" "D" "What is the phone number listed on the building in the foreground?" "206 444 5000" "206 441 4000" "206 451 5000" "206 441 5000" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/227.jpg" +"228" "A" "What is the number written on the blue tag?" "23" "32" "25" "21" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/228.jpg" +"229" "B" "What is the number written on the blue tag?" "25" "23" "21" "32" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/229.jpg" +"230" "C" "What is the number written on the blue tag?" "32" "21" "23" "25" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/230.jpg" +"231" "D" "What is the number written on the blue tag?" "25" "21" "32" "23" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/231.jpg" +"232" "A" "What is the registration number of the boat?" "TN-01-00026" "TN-01-00216" "TN-02-00056" "TN-03-00026" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/232.jpg" +"233" "B" "What is the registration number of the boat?" "TN-03-00026" "TN-01-00026" "TN-02-00056" "TN-01-00216" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/233.jpg" +"234" "C" "What is the registration number of the boat?" "TN-01-00216" "TN-02-00056" "TN-01-00026" "TN-03-00026" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/234.jpg" +"235" "D" "What is the registration number of the boat?" "TN-02-00056" "TN-03-00026" "TN-01-00216" "TN-01-00026" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/235.jpg" +"236" "A" "What is the color of the flag flying on the top of the boat?" "Yellow, blue and red" "Black, yellow and green" "Green, white and red" "Blue, white and red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/236.jpg" +"237" "B" "What is the color of the flag flying on the top of the boat?" "Blue, white and red" "Yellow, blue and red" "Green, white and red" "Black, yellow and green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/237.jpg" +"238" "C" "What is the color of the flag flying on the top of the boat?" "Black, yellow and green" "Green, white and red" "Yellow, blue and red" "Blue, white and red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/238.jpg" +"239" "D" "What is the color of the flag flying on the top of the boat?" "Black, yellow and green" "Green, white and red" "Blue, white and red" "Yellow, blue and red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/239.jpg" +"240" "A" "What is the model number of the train shown in the image?" "2001" "3001" "1002" "4005" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/240.jpg" +"241" "B" "What is the model number of the train shown in the image?" "1002" "2001" "3001" "4005" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/241.jpg" +"242" "C" "What is the model number of the train shown in the image?" "3001" "1002" "2001" "4005" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/242.jpg" +"243" "D" "What is the model number of the train shown in the image?" "4005" "1002" "3001" "2001" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/243.jpg" +"244" "A" "What is the color of the shirt worn by the person in the image?" "Blue" "Black" "Green" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/244.jpg" +"245" "B" "What is the color of the shirt worn by the person in the image?" "Red" "Blue" "Green" "Black" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/245.jpg" +"246" "C" "What is the color of the shirt worn by the person in the image?" "Green" "Red" "Blue" "Black" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/246.jpg" +"247" "D" "What is the color of the shirt worn by the person in the image?" "Black" "Red" "Green" "Blue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/247.jpg" +"248" "A" "What is written on the black and white sign above the parking garage entrance?" "Public Parking" "Loading Zone" "No Entry" "Reserved Parking" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/248.jpg" +"249" "B" "What is written on the black and white sign above the parking garage entrance?" "Reserved Parking" "Public Parking" "No Entry" "Loading Zone" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/249.jpg" +"250" "C" "What is written on the black and white sign above the parking garage entrance?" "No Entry" "Reserved Parking" "Public Parking" "Loading Zone" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/250.jpg" +"251" "D" "What is written on the black and white sign above the parking garage entrance?" "Reserved Parking" "Loading Zone" "No Entry" "Public Parking" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/251.jpg" +"252" "A" "What is the license plate number of the vehicle in the image?" "V-223-LV" "V-322-LV" "V-224-LV" "V-223-LW" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/252.jpg" +"253" "B" "What is the license plate number of the vehicle in the image?" "V-223-LW" "V-223-LV" "V-322-LV" "V-224-LV" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/253.jpg" +"254" "C" "What is the license plate number of the vehicle in the image?" "V-223-LW" "V-224-LV" "V-223-LV" "V-322-LV" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/254.jpg" +"255" "D" "What is the license plate number of the vehicle in the image?" "V-224-LV" "V-322-LV" "V-223-LW" "V-223-LV" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/255.jpg" +"256" "A" "What is the position of the person relative to the car?" "Top left" "Behind the car" "bottom right" "On the right" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/256.jpg" +"257" "B" "What is the position of the person relative to the car?" "Behind the car" "Top left" "On the right" "bottom right" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/257.jpg" +"258" "C" "What is the position of the person relative to the car?" "Behind the car" "On the right" "Top left" "bottom right" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/258.jpg" +"259" "D" "What is the position of the person relative to the car?" "Behind the car" "bottom right" "On the right" "Top left" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/259.jpg" +"260" "A" "What is the color of the car in the image?" "Black" "Green" "No car in the image" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/260.jpg" +"261" "B" "What is the color of the car in the image?" "Red" "Black" "Green" "No car in the image" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/261.jpg" +"262" "C" "What is the color of the car in the image?" "Green" "Red" "Black" "No car in the image" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/262.jpg" +"263" "D" "What is the color of the car in the image?" "Red" "Green" "No car in the image" "Black" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/263.jpg" +"264" "A" "What is the color of the pants worn by the person in the image?" "Black" "No person in the image" "Blue" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/264.jpg" +"265" "B" "What is the color of the pants worn by the person in the image?" "Blue" "Black" "Red" "No person in the image" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/265.jpg" +"266" "C" "What is the color of the pants worn by the person in the image?" "Red" "Blue" "Black" "No person in the image" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/266.jpg" +"267" "D" "What is the color of the pants worn by the person in the image?" "No person in the image" "Red" "Blue" "Black" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/267.jpg" +"268" "A" "What is the color of the flag?" "Red, yellow and green" "Blue, yellow and red" "Red, white and green" "Green, white and red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/268.jpg" +"269" "B" "What is the color of the flag?" "Blue, yellow and red" "Red, yellow and green" "Green, white and red" "Red, white and green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/269.jpg" +"270" "C" "What is the color of the flag?" "Blue, yellow and red" "Red, white and green" "Red, yellow and green" "Green, white and red" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/270.jpg" +"271" "D" "What is the color of the flag?" "Red, white and green" "Green, white and red" "Blue, yellow and red" "Red, yellow and green" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/271.jpg" +"272" "A" "What is the color of the trash can?" "Black" "Blue" "Yellow" "White" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/272.jpg" +"273" "B" "What is the color of the trash can?" "White" "Black" "Yellow" "Blue" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/273.jpg" +"274" "C" "What is the color of the trash can?" "Yellow" "White" "Black" "Blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/274.jpg" +"275" "D" "What is the color of the trash can?" "Blue" "White" "Yellow" "Black" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/275.jpg" +"276" "A" "What's the color of the dog?" "Black and white" "Yellow and green" "Pink" "Green and red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/276.jpg" +"277" "B" "What's the color of the dog?" "Green and red" "Black and white" "Yellow and green" "Pink" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/277.jpg" +"278" "C" "What's the color of the dog?" "Green and red" "Yellow and green" "Black and white" "Pink" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/278.jpg" +"279" "D" "What's the color of the dog?" "Pink" "Green and red" "Yellow and green" "Black and white" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/279.jpg" +"280" "A" "What are the letters written on the green trash bin?" "VP" "VD" "GP" "VA" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/280.jpg" +"281" "B" "What are the letters written on the green trash bin?" "GP" "VP" "VD" "VA" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/281.jpg" +"282" "C" "What are the letters written on the green trash bin?" "GP" "VA" "VP" "VD" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/282.jpg" +"283" "D" "What are the letters written on the green trash bin?" "VD" "GP" "VA" "VP" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/283.jpg" +"284" "A" "What direction arrows are shown on the black sign?" "Two left arrows" "Two right arrows" "No arrows" "Both left and right arrows" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/284.jpg" +"285" "B" "What direction arrows are shown on the black sign?" "Both left and right arrows" "Two left arrows" "No arrows" "Two right arrows" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/285.jpg" +"286" "C" "What direction arrows are shown on the black sign?" "Two right arrows" "No arrows" "Two left arrows" "Both left and right arrows" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/286.jpg" +"287" "D" "What direction arrows are shown on the black sign?" "Two right arrows" "No arrows" "Both left and right arrows" "Two left arrows" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/287.jpg" +"288" "A" "What text is written at the center of the black sign?" "ISTRE.PULA" "ISPRS.PULV" "ISTRR.PUIA" "ISPRS.PUSH" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/288.jpg" +"289" "B" "What text is written at the center of the black sign?" "ISPRS.PUSH" "ISTRE.PULA" "ISTRR.PUIA" "ISPRS.PULV" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/289.jpg" +"290" "C" "What text is written at the center of the black sign?" "ISPRS.PUSH" "ISPRS.PULV" "ISTRE.PULA" "ISTRR.PUIA" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/290.jpg" +"291" "D" "What text is written at the center of the black sign?" "ISPRS.PULV" "ISPRS.PUSH" "ISTRR.PUIA" "ISTRE.PULA" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/291.jpg" +"292" "A" "What's the number on the rectangular white sign?" "3" "8" "1" "5" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/292.jpg" +"293" "B" "What's the number on the rectangular white sign?" "1" "3" "5" "8" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/293.jpg" +"294" "C" "What's the number on the rectangular white sign?" "1" "5" "3" "8" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/294.jpg" +"295" "D" "What's the number on the rectangular white sign?" "5" "1" "8" "3" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/295.jpg" +"296" "A" "Tell me the text on the white building." "The text on the white building is ""DB""" "The text on the white building is ""AB""" "The text on the white building is ""DE""" "The text on the white building is ""CB""" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/296.jpg" +"297" "B" "Tell me the text on the white building." "The text on the white building is ""CB""" "The text on the white building is ""DB""" "The text on the white building is ""AB""" "The text on the white building is ""DE""" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/297.jpg" +"298" "C" "Tell me the text on the white building." "The text on the white building is ""AB""" "The text on the white building is ""CB""" "The text on the white building is ""DB""" "The text on the white building is ""DE""" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/298.jpg" +"299" "D" "Tell me the text on the white building." "The text on the white building is ""CB""" "The text on the white building is ""DE""" "The text on the white building is ""AB""" "The text on the white building is ""DB""" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/299.jpg" +"300" "A" "Which building has a red and white striped antenna on its top?" "The building with the Helaba logo" "The building with the DB logo" "The building with the Deutsche Bank logo" "The building with the Commerzbank logo" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/300.jpg" +"301" "B" "Which building has a red and white striped antenna on its top?" "The building with the Commerzbank logo" "The building with the Helaba logo" "The building with the DB logo" "The building with the Deutsche Bank logo" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/301.jpg" +"302" "C" "Which building has a red and white striped antenna on its top?" "The building with the Deutsche Bank logo" "The building with the Commerzbank logo" "The building with the Helaba logo" "The building with the DB logo" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/302.jpg" +"303" "D" "Which building has a red and white striped antenna on its top?" "The building with the DB logo" "The building with the Deutsche Bank logo" "The building with the Commerzbank logo" "The building with the Helaba logo" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/303.jpg" +"304" "A" "What is the material of the ceiling beams in the room?" "Wood" "Plastic" "Stone" "Metal" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/304.jpg" +"305" "B" "What is the material of the ceiling beams in the room?" "Stone" "Wood" "Metal" "Plastic" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/305.jpg" +"306" "C" "What is the material of the ceiling beams in the room?" "Metal" "Stone" "Wood" "Plastic" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/306.jpg" +"307" "D" "What is the material of the ceiling beams in the room?" "Stone" "Plastic" "Metal" "Wood" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/307.jpg" +"308" "A" "Where is the small stone cairn located relative to the waterfall?" "At the bottom right of the waterfall" "In the middle of the waterfall" "At the top of the waterfall" "To the left of the waterfall" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/308.jpg" +"309" "B" "Where is the small stone cairn located relative to the waterfall?" "In the middle of the waterfall" "At the bottom right of the waterfall" "To the left of the waterfall" "At the top of the waterfall" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/309.jpg" +"310" "C" "Where is the small stone cairn located relative to the waterfall?" "To the left of the waterfall" "In the middle of the waterfall" "At the bottom right of the waterfall" "At the top of the waterfall" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/310.jpg" +"311" "D" "Where is the small stone cairn located relative to the waterfall?" "In the middle of the waterfall" "At the top of the waterfall" "To the left of the waterfall" "At the bottom right of the waterfall" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/311.jpg" +"312" "A" "What is hanging on the wall inside the house?" "A piece of cloth" "A picture frame" "A clock" "A hat" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/312.jpg" +"313" "B" "What is hanging on the wall inside the house?" "A picture frame" "A piece of cloth" "A hat" "A clock" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/313.jpg" +"314" "C" "What is hanging on the wall inside the house?" "A hat" "A picture frame" "A piece of cloth" "A clock" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/314.jpg" +"315" "D" "What is hanging on the wall inside the house?" "A clock" "A picture frame" "A hat" "A piece of cloth" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/315.jpg" +"316" "A" "What is the object mounted on the wall in the background?" "A notice" "A clock" "A mirror" "A light" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/316.jpg" +"317" "B" "What is the object mounted on the wall in the background?" "A mirror" "A notice" "A light" "A clock" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/317.jpg" +"318" "C" "What is the object mounted on the wall in the background?" "A light" "A clock" "A notice" "A mirror" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/318.jpg" +"319" "D" "What is the object mounted on the wall in the background?" "A light" "A mirror" "A clock" "A notice" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/319.jpg" +"320" "A" "What is the color of the cup?" "Brown" "Blue" "Red" "Black" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/320.jpg" +"321" "B" "What is the color of the cup?" "Black" "Brown" "Blue" "Red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/321.jpg" +"322" "C" "What is the color of the cup?" "Black" "Red" "Brown" "Blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/322.jpg" +"323" "D" "What is the color of the cup?" "Red" "Black" "Blue" "Brown" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/323.jpg" +"324" "A" "What is the primary material of the cup lying on the ground?" "Cardboard" "Metal" "Plastic" "Glass" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/324.jpg" +"325" "B" "What is the primary material of the cup lying on the ground?" "Metal" "Cardboard" "Glass" "Plastic" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/325.jpg" +"326" "C" "What is the primary material of the cup lying on the ground?" "Glass" "Metal" "Cardboard" "Plastic" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/326.jpg" +"327" "D" "What is the primary material of the cup lying on the ground?" "Plastic" "Glass" "Metal" "Cardboard" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/327.jpg" +"328" "A" "What is the object located in the center of the grassy area?" "A statue" "A tree" "A rockery" "A fountain" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/328.jpg" +"329" "B" "What is the object located in the center of the grassy area?" "A rockery" "A statue" "A fountain" "A tree" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/329.jpg" +"330" "C" "What is the object located in the center of the grassy area?" "A fountain" "A tree" "A statue" "A rockery" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/330.jpg" +"331" "D" "What is the object located in the center of the grassy area?" "A rockery" "A tree" "A fountain" "A statue" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/331.jpg" +"332" "A" "What is the direction indicated on the sign pointing towards Zaragoza?" "Straight" "Left" "Downward" "Right" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/332.jpg" +"333" "B" "What is the direction indicated on the sign pointing towards Zaragoza?" "Right" "Straight" "Left" "Downward" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/333.jpg" +"334" "C" "What is the direction indicated on the sign pointing towards Zaragoza?" "Right" "Left" "Straight" "Downward" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/334.jpg" +"335" "D" "What is the direction indicated on the sign pointing towards Zaragoza?" "Downward" "Left" "Right" "Straight" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/335.jpg" +"336" "A" "What is the direction indicated on the sign pointing towards Alocén?" "Left" "Downward" "Straight" "Right" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/336.jpg" +"337" "B" "What is the direction indicated on the sign pointing towards Alocén?" "Straight" "Left" "Downward" "Right" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/337.jpg" +"338" "C" "What is the direction indicated on the sign pointing towards Alocén?" "Straight" "Right" "Left" "Downward" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/338.jpg" +"339" "D" "What is the direction indicated on the sign pointing towards Alocén?" "Downward" "Straight" "Right" "Left" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/339.jpg" +"340" "A" "What color is the car?" "White" "Black" "Blue" "Red" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/340.jpg" +"341" "B" "What color is the car?" "Red" "White" "Blue" "Black" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/341.jpg" +"342" "C" "What color is the car?" "Blue" "Red" "White" "Black" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/342.jpg" +"343" "D" "What color is the car?" "Black" "Blue" "Red" "White" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/343.jpg" +"344" "A" "What is the speed limit indicated on the sign in the image?" "30 km/h" "40 km/h" "60 km/h" "20 km/h" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/344.jpg" +"345" "B" "What is the speed limit indicated on the sign in the image?" "20 km/h" "30 km/h" "40 km/h" "60 km/h" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/345.jpg" +"346" "C" "What is the speed limit indicated on the sign in the image?" "20 km/h" "60 km/h" "30 km/h" "40 km/h" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/346.jpg" +"347" "D" "What is the speed limit indicated on the sign in the image?" "20 km/h" "40 km/h" "60 km/h" "30 km/h" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/347.jpg" +"348" "A" "What is the color of the flag?" "Red" "Blue" "Black" "White" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/348.jpg" +"349" "B" "What is the color of the flag?" "Black" "Red" "White" "Blue" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/349.jpg" +"350" "C" "What is the color of the flag?" "Black" "Blue" "Red" "White" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/350.jpg" +"351" "D" "What is the color of the flag?" "Blue" "Black" "White" "Red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/351.jpg" +"352" "A" "What is the name written on the boat?" "GONDOLA" "GENDOLA" "GENDALA" "GODOLA" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/352.jpg" +"353" "B" "What is the name written on the boat?" "GENDALA" "GONDOLA" "GENDOLA" "GODOLA" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/353.jpg" +"354" "C" "What is the name written on the boat?" "GODOLA" "GENDALA" "GONDOLA" "GENDOLA" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/354.jpg" +"355" "D" "What is the name written on the boat?" "GODOLA" "GENDOLA" "GENDALA" "GONDOLA" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/355.jpg" +"356" "A" "What is the speed limit indicated by the sign?" "30 km/h" "60 km/h" "50 km/h" "20 km/h" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/356.jpg" +"357" "B" "What is the speed limit indicated by the sign?" "50 km/h" "30 km/h" "20 km/h" "60 km/h" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/357.jpg" +"358" "C" "What is the speed limit indicated by the sign?" "50 km/h" "20 km/h" "30 km/h" "60 km/h" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/358.jpg" +"359" "D" "What is the speed limit indicated by the sign?" "60 km/h" "20 km/h" "50 km/h" "30 km/h" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/359.jpg" +"360" "A" "What is the name written on the front of the boat?" "Freedom" "Independence" "Froodom" "Liberty" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/360.jpg" +"361" "B" "What is the name written on the front of the boat?" "Independence" "Freedom" "Liberty" "Froodom" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/361.jpg" +"362" "C" "What is the name written on the front of the boat?" "Independence" "Liberty" "Freedom" "Froodom" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/362.jpg" +"363" "D" "What is the name written on the front of the boat?" "Froodom" "Independence" "Liberty" "Freedom" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/363.jpg" +"364" "A" "What is the color of the flag?" "Red and white" "Green and red" "Blue and white" "Yellow and black" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/364.jpg" +"365" "B" "What is the color of the flag?" "Blue and white" "Red and white" "Yellow and black" "Green and red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/365.jpg" +"366" "C" "What is the color of the flag?" "Green and red" "Blue and white" "Red and white" "Yellow and black" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/366.jpg" +"367" "D" "What is the color of the flag?" "Green and red" "Blue and white" "Yellow and black" "Red and white" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/367.jpg" +"368" "A" "What is the position of the Royal Albert Hall relative to the bus?" "To the left of the bus" "Directly behind the bus" "In front of the bus" "To the right of the bus" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/368.jpg" +"369" "B" "What is the position of the Royal Albert Hall relative to the bus?" "Directly behind the bus" "To the left of the bus" "In front of the bus" "To the right of the bus" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/369.jpg" +"370" "C" "What is the position of the Royal Albert Hall relative to the bus?" "To the right of the bus" "Directly behind the bus" "To the left of the bus" "In front of the bus" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/370.jpg" +"371" "D" "What is the position of the Royal Albert Hall relative to the bus?" "To the right of the bus" "Directly behind the bus" "In front of the bus" "To the left of the bus" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/371.jpg" +"372" "A" "Where are the houses located relative to the tea fields?" "At the top right corner" "In the bottom center" "At the top left corner" "In the middle of the tea fields" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/372.jpg" +"373" "B" "Where are the houses located relative to the tea fields?" "In the middle of the tea fields" "At the top right corner" "At the top left corner" "In the bottom center" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/373.jpg" +"374" "C" "Where are the houses located relative to the tea fields?" "In the bottom center" "In the middle of the tea fields" "At the top right corner" "At the top left corner" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/374.jpg" +"375" "D" "Where are the houses located relative to the tea fields?" "In the bottom center" "In the middle of the tea fields" "At the top left corner" "At the top right corner" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/375.jpg" +"376" "A" "What is the relative position of the white truck compared to the trams in the image?" "To the right of the trams" "To the left of the trams" "Bottom of the trams" "In top of the trams" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/376.jpg" +"377" "B" "What is the relative position of the white truck compared to the trams in the image?" "Bottom of the trams" "To the right of the trams" "In top of the trams" "To the left of the trams" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/377.jpg" +"378" "C" "What is the relative position of the white truck compared to the trams in the image?" "To the left of the trams" "In top of the trams" "To the right of the trams" "Bottom of the trams" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/378.jpg" +"379" "D" "What is the relative position of the white truck compared to the trams in the image?" "To the left of the trams" "In top of the trams" "Bottom of the trams" "To the right of the trams" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/379.jpg" +"380" "A" "What is the relative position of the red car compared to the black car?" "To the right of the black car" "To the left of the black car" "Behind the black car" "In front of the black car" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/380.jpg" +"381" "B" "What is the relative position of the red car compared to the black car?" "Behind the black car" "To the right of the black car" "To the left of the black car" "In front of the black car" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/381.jpg" +"382" "C" "What is the relative position of the red car compared to the black car?" "To the left of the black car" "Behind the black car" "To the right of the black car" "In front of the black car" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/382.jpg" +"383" "D" "What is the relative position of the red car compared to the black car?" "Behind the black car" "To the left of the black car" "In front of the black car" "To the right of the black car" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/383.jpg" +"384" "A" "What is the relative position of the pink banner compared to the green trash bin?" "To the left and slightly behind the green trash bin" "Directly above the green trash bin" "To the right and slightly in front of the green trash bin" "To the left and slightly in front of the green trash bin" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/384.jpg" +"385" "B" "What is the relative position of the pink banner compared to the green trash bin?" "To the right and slightly in front of the green trash bin" "To the left and slightly behind the green trash bin" "To the left and slightly in front of the green trash bin" "Directly above the green trash bin" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/385.jpg" +"386" "C" "What is the relative position of the pink banner compared to the green trash bin?" "To the left and slightly in front of the green trash bin" "Directly above the green trash bin" "To the left and slightly behind the green trash bin" "To the right and slightly in front of the green trash bin" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/386.jpg" +"387" "D" "What is the relative position of the pink banner compared to the green trash bin?" "To the right and slightly in front of the green trash bin" "Directly above the green trash bin" "To the left and slightly in front of the green trash bin" "To the left and slightly behind the green trash bin" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/387.jpg" +"388" "A" "What is the relative position of the person in light brown hat compared to the person wearing pink shirt?" "To the left of the person wearing the pink shirt" "To the right and slightly behind the person wearing the pink shirt" "Directly in front of the person wearing pink shirt" "To the right of the person wearing pink shirt" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/388.jpg" +"389" "B" "What is the relative position of the person in light brown hat compared to the person wearing pink shirt?" "To the right of the person wearing pink shirt" "To the left of the person wearing the pink shirt" "Directly in front of the person wearing pink shirt" "To the right and slightly behind the person wearing the pink shirt" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/389.jpg" +"390" "C" "What is the relative position of the person in light brown hat compared to the person wearing pink shirt?" "To the right of the person wearing pink shirt" "Directly in front of the person wearing pink shirt" "To the left of the person wearing the pink shirt" "To the right and slightly behind the person wearing the pink shirt" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/390.jpg" +"391" "D" "What is the relative position of the person in light brown hat compared to the person wearing pink shirt?" "To the right of the person wearing pink shirt" "Directly in front of the person wearing pink shirt" "To the right and slightly behind the person wearing the pink shirt" "To the left of the person wearing the pink shirt" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/391.jpg" +"392" "A" "What is the relative position of the white car compared to the large white building?" "To the left and behind the large white building" "To the left and in front of the large white building" "To the right and behind the large white building" "To the right and in front of the large white building" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/392.jpg" +"393" "B" "What is the relative position of the white car compared to the large white building?" "To the left and in front of the large white building" "To the left and behind the large white building" "To the right and in front of the large white building" "To the right and behind the large white building" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/393.jpg" +"394" "C" "What is the relative position of the white car compared to the large white building?" "To the right and in front of the large white building" "To the left and in front of the large white building" "To the left and behind the large white building" "To the right and behind the large white building" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/394.jpg" +"395" "D" "What is the relative position of the white car compared to the large white building?" "To the left and in front of the large white building" "To the right and behind the large white building" "To the right and in front of the large white building" "To the left and behind the large white building" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/395.jpg" +"396" "A" "What is the relative position of the black motorcycle compared to the silver car?" "To the left of the silver car" "Behind the silver car" "To the right of the silver car" "In front of the silver car" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/396.jpg" +"397" "B" "What is the relative position of the black motorcycle compared to the silver car?" "In front of the silver car" "To the left of the silver car" "To the right of the silver car" "Behind the silver car" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/397.jpg" +"398" "C" "What is the relative position of the black motorcycle compared to the silver car?" "In front of the silver car" "Behind the silver car" "To the left of the silver car" "To the right of the silver car" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/398.jpg" +"399" "D" "What is the relative position of the black motorcycle compared to the silver car?" "In front of the silver car" "To the right of the silver car" "Behind the silver car" "To the left of the silver car" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/399.jpg" +"400" "A" "What is the color of the flag on the left side?" "Black, red and yellow" "Green, white and orange" "Blue, white and red" "Red, white and orange" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/400.jpg" +"401" "B" "What is the color of the flag on the left side?" "Red, white and orange" "Black, red and yellow" "Blue, white and red" "Green, white and orange" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/401.jpg" +"402" "C" "What is the color of the flag on the left side?" "Green, white and orange" "Red, white and orange" "Black, red and yellow" "Blue, white and red" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/402.jpg" +"403" "D" "What is the color of the flag on the left side?" "Blue, white and red" "Green, white and orange" "Red, white and orange" "Black, red and yellow" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/403.jpg" +"404" "A" "What is the relative position of the small white building compared to the water?" "To the right of the water" "To the left of the water" "Behind the water" "In front of the water" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/404.jpg" +"405" "B" "What is the relative position of the small white building compared to the water?" "Behind the water" "To the right of the water" "In front of the water" "To the left of the water" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/405.jpg" +"406" "C" "What is the relative position of the small white building compared to the water?" "To the left of the water" "In front of the water" "To the right of the water" "Behind the water" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/406.jpg" +"407" "D" "What is the relative position of the small white building compared to the water?" "In front of the water" "Behind the water" "To the left of the water" "To the right of the water" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/407.jpg" +"408" "A" "How many computers are visible on the table?" "Five computers" "Three computers" "Four computers" "Two computers" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/408.jpg" +"409" "B" "How many computers are visible on the table?" "Three computers" "Five computers" "Two computers" "Four computers" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/409.jpg" +"410" "C" "How many computers are visible on the table?" "Two computers" "Four computers" "Five computers" "Three computers" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/410.jpg" +"411" "D" "How many computers are visible on the table?" "Four computers" "Three computers" "Two computers" "Five computers" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/411.jpg" +"412" "A" "What is the relative position of the American flag in the image?" "To the left of the bear statue" "Directly above the log" "Near the center of the image" "To the right of the bear statue" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/412.jpg" +"413" "B" "What is the relative position of the American flag in the image?" "To the right of the bear statue" "To the left of the bear statue" "Directly above the log" "Near the center of the image" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/413.jpg" +"414" "C" "What is the relative position of the American flag in the image?" "To the right of the bear statue" "Directly above the log" "To the left of the bear statue" "Near the center of the image" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/414.jpg" +"415" "D" "What is the relative position of the American flag in the image?" "Near the center of the image" "To the right of the bear statue" "Directly above the log" "To the left of the bear statue" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/415.jpg" +"416" "A" "Where is the ""OPEN"" sign located in the image?" "Near the center, under the roof" "Above the entrance to the building" "On the right side of the bear statue" "On the left side of the bear statue" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/416.jpg" +"417" "B" "Where is the ""OPEN"" sign located in the image?" "Above the entrance to the building" "Near the center, under the roof" "On the right side of the bear statue" "On the left side of the bear statue" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/417.jpg" +"418" "C" "Where is the ""OPEN"" sign located in the image?" "On the right side of the bear statue" "Above the entrance to the building" "Near the center, under the roof" "On the left side of the bear statue" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/418.jpg" +"419" "D" "Where is the ""OPEN"" sign located in the image?" "On the right side of the bear statue" "Above the entrance to the building" "On the left side of the bear statue" "Near the center, under the roof" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/419.jpg" +"420" "A" "What is the position of the totem pole in relation to the bear statue?" "To the left of the bear statue" "To the right of the bear statue" "Behind the bear statue" "In front of the bear statue" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/420.jpg" +"421" "B" "What is the position of the totem pole in relation to the bear statue?" "Behind the bear statue" "To the left of the bear statue" "To the right of the bear statue" "In front of the bear statue" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/421.jpg" +"422" "C" "What is the position of the totem pole in relation to the bear statue?" "In front of the bear statue" "Behind the bear statue" "To the left of the bear statue" "To the right of the bear statue" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/422.jpg" +"423" "D" "What is the position of the totem pole in relation to the bear statue?" "To the right of the bear statue" "Behind the bear statue" "In front of the bear statue" "To the left of the bear statue" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/423.jpg" +"424" "A" "What is the direction of the overhead electric wires in relation to the train?" "Parallel to the train" "Perpendicular to the train" "Diagonal to the train" "Curved above the train" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/424.jpg" +"425" "B" "What is the direction of the overhead electric wires in relation to the train?" "Perpendicular to the train" "Parallel to the train" "Curved above the train" "Diagonal to the train" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/425.jpg" +"426" "C" "What is the direction of the overhead electric wires in relation to the train?" "Diagonal to the train" "Curved above the train" "Parallel to the train" "Perpendicular to the train" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/426.jpg" +"427" "D" "What is the direction of the overhead electric wires in relation to the train?" "Curved above the train" "Perpendicular to the train" "Diagonal to the train" "Parallel to the train" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/427.jpg" +"428" "A" "What is the relative position of the person in the red jacket compared to the large tree?" "To the right of the large tree" "In front of the large tree" "To the left of the large tree" "Behind the large tree" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/428.jpg" +"429" "B" "What is the relative position of the person in the red jacket compared to the large tree?" "Behind the large tree" "To the right of the large tree" "In front of the large tree" "To the left of the large tree" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/429.jpg" +"430" "C" "What is the relative position of the person in the red jacket compared to the large tree?" "In front of the large tree" "Behind the large tree" "To the right of the large tree" "To the left of the large tree" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/430.jpg" +"431" "D" "What is the relative position of the person in the red jacket compared to the large tree?" "Behind the large tree" "In front of the large tree" "To the left of the large tree" "To the right of the large tree" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/431.jpg" +"432" "A" "What type of structure is visible to the right of the image?" "An elephant statue" "A car" "A bridge" "A house" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/432.jpg" +"433" "B" "What type of structure is visible to the right of the image?" "A house" "An elephant statue" "A bridge" "A car" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/433.jpg" +"434" "C" "What type of structure is visible to the right of the image?" "A car" "A bridge" "An elephant statue" "A house" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/434.jpg" +"435" "D" "What type of structure is visible to the right of the image?" "A bridge" "A house" "A car" "An elephant statue" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/435.jpg" +"436" "A" "How many people are standing in front of the entrance of the building?" "Four" "Two" "Five" "Three" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/436.jpg" +"437" "B" "How many people are standing in front of the entrance of the building?" "Five" "Four" "Three" "Two" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/437.jpg" +"438" "C" "How many people are standing in front of the entrance of the building?" "Three" "Two" "Four" "Five" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/438.jpg" +"439" "D" "How many people are standing in front of the entrance of the building?" "Three" "Five" "Two" "Four" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/439.jpg" +"440" "A" "Which tower is closer to the viewer, the left tower or the right tower?" "The left tower" "Both are equisdistant" "The right tower" "No tower here" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/440.jpg" +"441" "B" "Which tower is closer to the viewer, the left tower or the right tower?" "Both are equisdistant" "The left tower" "The right tower" "No tower here" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/441.jpg" +"442" "C" "Which tower is closer to the viewer, the left tower or the right tower?" "The right tower" "No tower here" "The left tower" "Both are equisdistant" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/442.jpg" +"443" "D" "Which tower is closer to the viewer, the left tower or the right tower?" "No tower here" "The right tower" "Both are equisdistant" "The left tower" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/443.jpg" +"444" "A" "What is the building behind the statue?" "District of Columbia Court of Appeals" "White House" "Supreme Court" "Capitol Building" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/444.jpg" +"445" "B" "What is the building behind the statue?" "Capitol Building" "District of Columbia Court of Appeals" "White House" "Supreme Court" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/445.jpg" +"446" "C" "What is the building behind the statue?" "Capitol Building" "Supreme Court" "District of Columbia Court of Appeals" "White House" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/446.jpg" +"447" "D" "What is the building behind the statue?" "White House" "Capitol Building" "Supreme Court" "District of Columbia Court of Appeals" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/447.jpg" +"448" "A" "Where is the statue located in the image?" "The statue is located on the right side of the image" "The statue is located inside the colonnade" "The statue is located in the center of the colonnade" "The statue is located on the left side of the image" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/448.jpg" +"449" "B" "Where is the statue located in the image?" "The statue is located in the center of the colonnade" "The statue is located on the right side of the image" "The statue is located on the left side of the image" "The statue is located inside the colonnade" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/449.jpg" +"450" "C" "Where is the statue located in the image?" "The statue is located on the left side of the image" "The statue is located inside the colonnade" "The statue is located on the right side of the image" "The statue is located in the center of the colonnade" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/450.jpg" +"451" "D" "Where is the statue located in the image?" "The statue is located inside the colonnade" "The statue is located on the left side of the image" "The statue is located in the center of the colonnade" "The statue is located on the right side of the image" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/451.jpg" +"452" "A" "What is the object directly to the right of the main entrance of the church?" "A statue of a saint" "A lamp post" "A window" "A dog" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/452.jpg" +"453" "B" "What is the object directly to the right of the main entrance of the church?" "A dog" "A statue of a saint" "A lamp post" "A window" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/453.jpg" +"454" "C" "What is the object directly to the right of the main entrance of the church?" "A window" "A lamp post" "A statue of a saint" "A dog" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/454.jpg" +"455" "D" "What is the object directly to the right of the main entrance of the church?" "A window" "A lamp post" "A dog" "A statue of a saint" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/455.jpg" +"456" "A" "In which direction is the child in the foreground running on the bridge?" "Away from the camera" "Towards the camera" "No child in the image" "Sideways" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/456.jpg" +"457" "B" "In which direction is the child in the foreground running on the bridge?" "Sideways" "Away from the camera" "Towards the camera" "No child in the image" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/457.jpg" +"458" "C" "In which direction is the child in the foreground running on the bridge?" "Sideways" "No child in the image" "Away from the camera" "Towards the camera" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/458.jpg" +"459" "D" "In which direction is the child in the foreground running on the bridge?" "No child in the image" "Towards the camera" "Sideways" "Away from the camera" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/459.jpg" +"460" "A" "What is the relative position of the person compared to the building?" "The person is located to the right of the building" "The person is in front of the building" "No person in the image" "The person is located to the left of the building" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/460.jpg" +"461" "B" "What is the relative position of the person compared to the building?" "The person is in front of the building" "The person is located to the right of the building" "No person in the image" "The person is located to the left of the building" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/461.jpg" +"462" "C" "What is the relative position of the person compared to the building?" "The person is in front of the building" "No person in the image" "The person is located to the right of the building" "The person is located to the left of the building" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/462.jpg" +"463" "D" "What is the relative position of the person compared to the building?" "The person is in front of the building" "No person in the image" "The person is located to the left of the building" "The person is located to the right of the building" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/463.jpg" +"464" "A" "What is located to the right of the main house in the image?" "A smaller building" "A boat" "A car" "A large tree" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/464.jpg" +"465" "B" "What is located to the right of the main house in the image?" "A boat" "A smaller building" "A car" "A large tree" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/465.jpg" +"466" "C" "What is located to the right of the main house in the image?" "A boat" "A large tree" "A smaller building" "A car" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/466.jpg" +"467" "D" "What is located to the right of the main house in the image?" "A large tree" "A car" "A boat" "A smaller building" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/467.jpg" +"468" "A" "Where is the clock located in the room?" "On the wall to the right of the main seating area" "No clock in the room" "Above the main seating area" "On the wall to the left of the main seating area" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/468.jpg" +"469" "B" "Where is the clock located in the room?" "No clock in the room" "On the wall to the right of the main seating area" "On the wall to the left of the main seating area" "Above the main seating area" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/469.jpg" +"470" "C" "Where is the clock located in the room?" "Above the main seating area" "No clock in the room" "On the wall to the right of the main seating area" "On the wall to the left of the main seating area" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/470.jpg" +"471" "D" "Where is the clock located in the room?" "No clock in the room" "On the wall to the left of the main seating area" "Above the main seating area" "On the wall to the right of the main seating area" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/471.jpg" +"472" "A" "What is the relative position of the component labeled ""Sony"" compared to the component labeled ""Mavica""?" "Right" "Left" "Above" "Behind" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/472.jpg" +"473" "B" "What is the relative position of the component labeled ""Sony"" compared to the component labeled ""Mavica""?" "Behind" "Right" "Left" "Above" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/473.jpg" +"474" "C" "What is the relative position of the component labeled ""Sony"" compared to the component labeled ""Mavica""?" "Left" "Behind" "Right" "Above" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/474.jpg" +"475" "D" "What is the relative position of the component labeled ""Sony"" compared to the component labeled ""Mavica""?" "Behind" "Above" "Left" "Right" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/475.jpg" +"476" "A" "What is written on the parachute?" "SWING" "SWOOP" "SPRING" "SWIRL" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/476.jpg" +"477" "B" "What is written on the parachute?" "SWOOP" "SWING" "SPRING" "SWIRL" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/477.jpg" +"478" "C" "What is written on the parachute?" "SWIRL" "SPRING" "SWING" "SWOOP" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/478.jpg" +"479" "D" "What is written on the parachute?" "SPRING" "SWOOP" "SWIRL" "SWING" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/479.jpg" +"480" "A" "What is written on the parachute?" "SWIRL" "SWING" "SWOOP" "SPRING" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/480.jpg" +"481" "B" "What is written on the parachute?" "SPRING" "SWIRL" "SWING" "SWOOP" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/481.jpg" +"482" "C" "What is written on the parachute?" "SWING" "SWOOP" "SWIRL" "SPRING" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/482.jpg" +"483" "D" "What is written on the parachute?" "SPRING" "SWING" "SWOOP" "SWIRL" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/483.jpg" +"484" "A" "What is written on the parachute?" "SWOOP" "SWING" "SPRING" "SWIRL" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/484.jpg" +"485" "B" "What is written on the parachute?" "SWIRL" "SWOOP" "SWING" "SPRING" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/485.jpg" +"486" "C" "What is written on the parachute?" "SWIRL" "SWING" "SWOOP" "SPRING" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/486.jpg" +"487" "D" "What is written on the parachute?" "SWING" "SWIRL" "SPRING" "SWOOP" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/487.jpg" +"488" "A" "What is written on the parachute?" "SPRING" "SWIRL" "SWING" "SWOOP" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/488.jpg" +"489" "B" "What is written on the parachute?" "SWOOP" "SPRING" "SWIRL" "SWING" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/489.jpg" +"490" "C" "What is written on the parachute?" "SWIRL" "SWING" "SPRING" "SWOOP" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/490.jpg" +"491" "D" "What is written on the parachute?" "SWIRL" "SWOOP" "SWING" "SPRING" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/491.jpg" +"492" "A" "What word is visible on the suitcase?" "Dally" "Daily" "Rally" "Dolly" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/492.jpg" +"493" "B" "What word is visible on the suitcase?" "Dolly" "Dally" "Rally" "Daily" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/493.jpg" +"494" "C" "What word is visible on the suitcase?" "Dolly" "Daily" "Dally" "Rally" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/494.jpg" +"495" "D" "What word is visible on the suitcase?" "Daily" "Dolly" "Rally" "Dally" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/495.jpg" +"496" "A" "What word is visible on the suitcase?" "Dolly" "Rally" "Daily" "Dally" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/496.jpg" +"497" "B" "What word is visible on the suitcase?" "Rally" "Dolly" "Dally" "Daily" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/497.jpg" +"498" "C" "What word is visible on the suitcase?" "Dally" "Daily" "Dolly" "Rally" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/498.jpg" +"499" "D" "What word is visible on the suitcase?" "Rally" "Daily" "Dally" "Dolly" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/499.jpg" +"500" "A" "What word is written on the hang glider?" "Windy" "Cloudy" "Stormy" "Sunny" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/500.jpg" +"501" "B" "What word is written on the hang glider?" "Cloudy" "Windy" "Sunny" "Stormy" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/501.jpg" +"502" "C" "What word is written on the hang glider?" "Sunny" "Cloudy" "Windy" "Stormy" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/502.jpg" +"503" "D" "What word is written on the hang glider?" "Stormy" "Sunny" "Cloudy" "Windy" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/503.jpg" +"504" "A" "What word is written on the hang glider?" "Cloudy" "Windy" "Sunny" "Stormy" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/504.jpg" +"505" "B" "What word is written on the hang glider?" "Windy" "Cloudy" "Sunny" "Stormy" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/505.jpg" +"506" "C" "What word is written on the hang glider?" "Windy" "Stormy" "Cloudy" "Sunny" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/506.jpg" +"507" "D" "What word is written on the hang glider?" "Sunny" "Stormy" "Windy" "Cloudy" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/507.jpg" +"508" "A" "What word is written on the hang glider?" "Sunny" "Windy" "Cloudy" "Stormy" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/508.jpg" +"509" "B" "What word is written on the hang glider?" "Windy" "Sunny" "Cloudy" "Stormy" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/509.jpg" +"510" "C" "What word is written on the hang glider?" "Windy" "Cloudy" "Sunny" "Stormy" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/510.jpg" +"511" "D" "What word is written on the hang glider?" "Cloudy" "Windy" "Stormy" "Sunny" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/511.jpg" +"512" "A" "What word is written on the hang glider?" "Stormy" "Sunny" "Windy" "Cloudy" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/512.jpg" +"513" "B" "What word is written on the hang glider?" "Windy" "Stormy" "Cloudy" "Sunny" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/513.jpg" +"514" "C" "What word is written on the hang glider?" "Cloudy" "Sunny" "Stormy" "Windy" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/514.jpg" +"515" "D" "What word is written on the hang glider?" "Sunny" "Windy" "Cloudy" "Stormy" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/515.jpg" +"516" "A" "What is the license plate number of the car?" "217722-ROMA" "217722-ROM" "21722-ROMA" "217722-RMA" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/516.jpg" +"517" "B" "What is the license plate number of the car?" "217722-RMA" "217722-ROMA" "21722-ROMA" "217722-ROM" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/517.jpg" +"518" "C" "What is the license plate number of the car?" "217722-RMA" "21722-ROMA" "217722-ROMA" "217722-ROM" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/518.jpg" +"519" "D" "What is the license plate number of the car?" "21722-ROMA" "217722-ROM" "217722-RMA" "217722-ROMA" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/519.jpg" +"520" "A" "Where is the bird positioned in relation to the car?" "To the left side on the ground in front of the car" "To the right side of the car" "Behind the car" "On top of the car" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/520.jpg" +"521" "B" "Where is the bird positioned in relation to the car?" "Behind the car" "To the left side on the ground in front of the car" "To the right side of the car" "On top of the car" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/521.jpg" +"522" "C" "Where is the bird positioned in relation to the car?" "On top of the car" "Behind the car" "To the left side on the ground in front of the car" "To the right side of the car" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/522.jpg" +"523" "D" "Where is the bird positioned in relation to the car?" "On top of the car" "Behind the car" "To the right side of the car" "To the left side on the ground in front of the car" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/523.jpg" +"524" "A" "What is written inside the red rectangle on the sign?" "Muzium Tekstil Negara, National Textile Museum" "Muzium Tekstil Negara, National Music Museum" "Muzium Kebudayaan Negara, National Culture Museum" "Muzium Kesenian Negara, National Art Museum" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/524.jpg" +"525" "B" "What is written inside the red rectangle on the sign?" "Muzium Kebudayaan Negara, National Culture Museum" "Muzium Tekstil Negara, National Textile Museum" "Muzium Tekstil Negara, National Music Museum" "Muzium Kesenian Negara, National Art Museum" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/525.jpg" +"526" "C" "What is written inside the red rectangle on the sign?" "Muzium Kesenian Negara, National Art Museum" "Muzium Tekstil Negara, National Music Museum" "Muzium Tekstil Negara, National Textile Museum" "Muzium Kebudayaan Negara, National Culture Museum" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/526.jpg" +"527" "D" "What is written inside the red rectangle on the sign?" "Muzium Kebudayaan Negara, National Culture Museum" "Muzium Kesenian Negara, National Art Museum" "Muzium Tekstil Negara, National Music Museum" "Muzium Tekstil Negara, National Textile Museum" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/527.jpg" +"528" "A" "What is written inside the red rectangle on the sign?" "AGRO BANK" "AGRA BANK" "AGRC BANK" "AGRT BANK" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/528.jpg" +"529" "B" "What is written inside the red rectangle on the sign?" "AGRC BANK" "AGRO BANK" "AGRA BANK" "AGRT BANK" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/529.jpg" +"530" "C" "What is written inside the red rectangle on the sign?" "AGRC BANK" "AGRT BANK" "AGRO BANK" "AGRA BANK" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/530.jpg" +"531" "D" "What is written inside the red rectangle on the sign?" "AGRT BANK" "AGRA BANK" "AGRC BANK" "AGRO BANK" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/531.jpg" +"532" "A" "Which direction is the taller white building in relation to the National Textile Museum?" "Right" "Above" "Left" "Behind" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/532.jpg" +"533" "B" "Which direction is the taller white building in relation to the National Textile Museum?" "Above" "Right" "Behind" "Left" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/533.jpg" +"534" "C" "Which direction is the taller white building in relation to the National Textile Museum?" "Left" "Behind" "Right" "Above" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/534.jpg" +"535" "D" "Which direction is the taller white building in relation to the National Textile Museum?" "Behind" "Left" "Above" "Right" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/535.jpg" +"536" "A" "What word is written on the building to the left in the image?" "family" "house" "five" "office" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/536.jpg" +"537" "B" "What word is written on the building to the left in the image?" "office" "family" "five" "house" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/537.jpg" +"538" "C" "What word is written on the building to the left in the image?" "house" "office" "family" "five" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/538.jpg" +"539" "D" "What word is written on the building to the left in the image?" "office" "house" "five" "family" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/539.jpg" +"540" "A" "What color is the car located to the right of the orange car in the image?" "Yellow" "Black" "Red" "Blue" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/540.jpg" +"541" "B" "What color is the car located to the right of the orange car in the image?" "Red" "Yellow" "Black" "Blue" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/541.jpg" +"542" "C" "What color is the car located to the right of the orange car in the image?" "Red" "Black" "Yellow" "Blue" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/542.jpg" +"543" "D" "What color is the car located to the right of the orange car in the image?" "Red" "Black" "Blue" "Yellow" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/543.jpg" +"544" "A" "What is the object placed directly in front of the bench on the left side of the image?" "bicycle" "trash can" "car" "scooter" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/544.jpg" +"545" "B" "What is the object placed directly in front of the bench on the left side of the image?" "car" "bicycle" "scooter" "trash can" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/545.jpg" +"546" "C" "What is the object placed directly in front of the bench on the left side of the image?" "scooter" "car" "bicycle" "trash can" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/546.jpg" +"547" "D" "What is the object placed directly in front of the bench on the left side of the image?" "scooter" "trash can" "car" "bicycle" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/547.jpg" +"548" "A" "How many people are seated at the table on the right side of the image where a woman in a striped shirt is standing?" "Three people" "Five people" "Two people" "Four people" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/548.jpg" +"549" "B" "How many people are seated at the table on the right side of the image where a woman in a striped shirt is standing?" "Two people" "Three people" "Five people" "Four people" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/549.jpg" +"550" "C" "How many people are seated at the table on the right side of the image where a woman in a striped shirt is standing?" "Two people" "Five people" "Three people" "Four people" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/550.jpg" +"551" "D" "How many people are seated at the table on the right side of the image where a woman in a striped shirt is standing?" "Two people" "Four people" "Five people" "Three people" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/551.jpg" +"552" "A" "What object can be seen inside the partially built brick structure?" "A wooden box with flowers" "A dog" "A metal chair" "A plastic bag" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/552.jpg" +"553" "B" "What object can be seen inside the partially built brick structure?" "A plastic bag" "A wooden box with flowers" "A metal chair" "A dog" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/553.jpg" +"554" "C" "What object can be seen inside the partially built brick structure?" "A plastic bag" "A metal chair" "A wooden box with flowers" "A dog" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/554.jpg" +"555" "D" "What object can be seen inside the partially built brick structure?" "A plastic bag" "A dog" "A metal chair" "A wooden box with flowers" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/555.jpg" +"556" "A" "What is the position of the chair relative to the bicycles?" "To the left of the bicycles" "In front of the bicycles" "Behind the bicycles" "To the right of the bicycles" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/556.jpg" +"557" "B" "What is the position of the chair relative to the bicycles?" "In front of the bicycles" "To the left of the bicycles" "To the right of the bicycles" "Behind the bicycles" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/557.jpg" +"558" "C" "What is the position of the chair relative to the bicycles?" "To the right of the bicycles" "In front of the bicycles" "To the left of the bicycles" "Behind the bicycles" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/558.jpg" +"559" "D" "What is the position of the chair relative to the bicycles?" "To the right of the bicycles" "Behind the bicycles" "In front of the bicycles" "To the left of the bicycles" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/559.jpg" +"560" "A" "How many bicycles are visible near the building's entrance?" "Three" "One" "Four" "Two" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/560.jpg" +"561" "B" "How many bicycles are visible near the building's entrance?" "Two" "Three" "Four" "One" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/561.jpg" +"562" "C" "How many bicycles are visible near the building's entrance?" "Two" "Four" "Three" "One" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/562.jpg" +"563" "D" "How many bicycles are visible near the building's entrance?" "Four" "One" "Two" "Three" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/563.jpg" +"564" "A" "What is the position of the car relative to the statue of lion?" "To the left behind of statue of lion" "Behind the statue of lion" "To the right behind of statue of lion" "In front of the statue of lion" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/564.jpg" +"565" "B" "What is the position of the car relative to the statue of lion?" "In front of the statue of lion" "To the left behind of statue of lion" "To the right behind of statue of lion" "Behind the statue of lion" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/565.jpg" +"566" "C" "What is the position of the car relative to the statue of lion?" "To the right behind of statue of lion" "In front of the statue of lion" "To the left behind of statue of lion" "Behind the statue of lion" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/566.jpg" +"567" "D" "What is the position of the car relative to the statue of lion?" "Behind the statue of lion" "In front of the statue of lion" "To the right behind of statue of lion" "To the left behind of statue of lion" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/567.jpg" +"568" "A" "What is the position of the car relative to the central tower of the building?" "Left" "In front of the building" "Behind the building" "Right" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/568.jpg" +"569" "B" "What is the position of the car relative to the central tower of the building?" "Behind the building" "Left" "Right" "In front of the building" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/569.jpg" +"570" "C" "What is the position of the car relative to the central tower of the building?" "Right" "Behind the building" "Left" "In front of the building" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/570.jpg" +"571" "D" "What is the position of the car relative to the central tower of the building?" "Behind the building" "Right" "In front of the building" "Left" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/571.jpg" +"572" "A" "What is the primary function of the object in the red circle?" "To hold and dispense water for drinking" "To store chemicals for laboratory use" "To serve as a container for cooking oil" "To be used as a decorative item" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/572.jpg" +"573" "B" "What is the primary function of the object in the red circle?" "To store chemicals for laboratory use" "To hold and dispense water for drinking" "To be used as a decorative item" "To serve as a container for cooking oil" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/573.jpg" +"574" "C" "What is the primary function of the object in the red circle?" "To store chemicals for laboratory use" "To be used as a decorative item" "To hold and dispense water for drinking" "To serve as a container for cooking oil" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/574.jpg" +"575" "D" "What is the primary function of the object in the red circle?" "To serve as a container for cooking oil" "To store chemicals for laboratory use" "To be used as a decorative item" "To hold and dispense water for drinking" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/575.jpg" +"576" "A" "What is the purpose of the label in the red circle?" "The label indicates that consumers can get a refund of 10 cents if they return the bottle to a recycling center in California" "The label indicates a special tax that applies only to this brand of water in California" "The label indicates that the bottle costs an extra 10 cents in California" "The label is a discount coupon for purchasing the bottle" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/576.jpg" +"577" "B" "What is the purpose of the label in the red circle?" "The label indicates that the bottle costs an extra 10 cents in California" "The label indicates that consumers can get a refund of 10 cents if they return the bottle to a recycling center in California" "The label is a discount coupon for purchasing the bottle" "The label indicates a special tax that applies only to this brand of water in California" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/577.jpg" +"578" "C" "What is the purpose of the label in the red circle?" "The label indicates that the bottle costs an extra 10 cents in California" "The label is a discount coupon for purchasing the bottle" "The label indicates that consumers can get a refund of 10 cents if they return the bottle to a recycling center in California" "The label indicates a special tax that applies only to this brand of water in California" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/578.jpg" +"579" "D" "What is the purpose of the label in the red circle?" "The label is a discount coupon for purchasing the bottle" "The label indicates that the bottle costs an extra 10 cents in California" "The label indicates a special tax that applies only to this brand of water in California" "The label indicates that consumers can get a refund of 10 cents if they return the bottle to a recycling center in California" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/579.jpg" +"580" "A" "What does the label in the red circle signify?" "The manufacturer assures the quality of the product and may offer a refund or relpacement if the consumer is not satisfied" "The label guarantees that the bottle will not leak" "The label indicates that the water is 100% pure with no additives" "The bottle is made from 100% recycled materials" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/580.jpg" +"581" "B" "What does the label in the red circle signify?" "The bottle is made from 100% recycled materials" "The manufacturer assures the quality of the product and may offer a refund or relpacement if the consumer is not satisfied" "The label guarantees that the bottle will not leak" "The label indicates that the water is 100% pure with no additives" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/581.jpg" +"582" "C" "What does the label in the red circle signify?" "The bottle is made from 100% recycled materials" "The label guarantees that the bottle will not leak" "The manufacturer assures the quality of the product and may offer a refund or relpacement if the consumer is not satisfied" "The label indicates that the water is 100% pure with no additives" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/582.jpg" +"583" "D" "What does the label in the red circle signify?" "The bottle is made from 100% recycled materials" "The label guarantees that the bottle will not leak" "The label indicates that the water is 100% pure with no additives" "The manufacturer assures the quality of the product and may offer a refund or relpacement if the consumer is not satisfied" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/583.jpg" +"584" "A" "What does the Chinese text in the red rectangle translate to in English?" "Tong Fuk Nam Trading" "Dragon Street Bazaar" "Happy Fortune Shop" "Hong Kong Market" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/584.jpg" +"585" "B" "What does the Chinese text in the red rectangle translate to in English?" "Hong Kong Market" "Tong Fuk Nam Trading" "Happy Fortune Shop" "Dragon Street Bazaar" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/585.jpg" +"586" "C" "What does the Chinese text in the red rectangle translate to in English?" "Happy Fortune Shop" "Hong Kong Market" "Tong Fuk Nam Trading" "Dragon Street Bazaar" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/586.jpg" +"587" "D" "What does the Chinese text in the red rectangle translate to in English?" "Hong Kong Market" "Dragon Street Bazaar" "Happy Fortune Shop" "Tong Fuk Nam Trading" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/587.jpg" +"588" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 4" "Locations 2 and 3" "Locations 1 and 2" "Locations 3 and 4" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/588.jpg" +"589" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 4" "Locations 1 and 2" "Locations 3 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/589.jpg" +"590" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 3 and 4" "Locations 1 and 4" "Locations 1 and 2" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/590.jpg" +"591" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 3 and 4" "Locations 2 and 3" "Locations 1 and 4" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/591.jpg" +"592" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 2 and 4" "Locations 3 and 4" "Locations 1 and 4" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/592.jpg" +"593" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 2" "Locations 1 and 4" "Locations 3 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/593.jpg" +"594" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 3 and 4" "Locations 2 and 4" "Locations 1 and 2" "Locations 1 and 4" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/594.jpg" +"595" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 3 and 4" "Locations 1 and 4" "Locations 1 and 2" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/595.jpg" +"596" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 3 and 4" "Locations 1 and 4" "Locations 2 and 4" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/596.jpg" +"597" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 3 and 4" "Locations 1 and 2" "Locations 2 and 4" "Locations 1 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/597.jpg" +"598" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 3 and 4" "Locations 2 and 4" "Locations 1 and 2" "Locations 1 and 4" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/598.jpg" +"599" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 4" "Locations 3 and 4" "Locations 2 and 4" "Locations 1 and 2" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/599.jpg" +"600" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 4" "Locations 2 and 3" "Locations 1 and 2" "Locations 3 and 4" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/600.jpg" +"601" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 1 and 4" "Locations 2 and 3" "Locations 3 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/601.jpg" +"602" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 3 and 4" "Locations 2 and 3" "Locations 1 and 4" "Locations 1 and 2" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/602.jpg" +"603" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 3 and 4" "Locations 1 and 2" "Locations 1 and 4" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/603.jpg" +"604" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 2 and 3" "Locations 2 and 4" "Locations 1 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/604.jpg" +"605" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 2" "Locations 2 and 4" "Locations 1 and 3" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/605.jpg" +"606" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 3" "Locations 2 and 3" "Locations 1 and 2" "Locations 2 and 4" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/606.jpg" +"607" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 3" "Locations 2 and 4" "Locations 1 and 2" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/607.jpg" +"608" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 2 and 4" "Locations 2 and 3" "Locations 1 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/608.jpg" +"609" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 2" "Locations 1 and 3" "Locations 2 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/609.jpg" +"610" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 3" "Locations 1 and 2" "Locations 2 and 3" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/610.jpg" +"611" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 3" "Locations 2 and 4" "Locations 1 and 2" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/611.jpg" +"612" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 2 and 4" "Locations 1 and 3" "Locations 2 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/612.jpg" +"613" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 2" "Locations 2 and 3" "Locations 1 and 3" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/613.jpg" +"614" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 2 and 3" "Locations 1 and 2" "Locations 1 and 3" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/614.jpg" +"615" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 3" "Locations 2 and 3" "Locations 1 and 2" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/615.jpg" +"616" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 4" "Locations 1 and 3" "Locations 2 and 4" "Locations 2 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/616.jpg" +"617" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 3" "Locations 1 and 4" "Locations 2 and 4" "Locations 2 and 3" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/617.jpg" +"618" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 2 and 4" "Locations 1 and 4" "Locations 1 and 3" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/618.jpg" +"619" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 2 and 3" "Locations 1 and 3" "Locations 1 and 4" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/619.jpg" +"620" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 4" "Locations 1 and 3" "Locations 2 and 4" "Locations 1 and 2" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/620.jpg" +"621" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 1 and 4" "Locations 1 and 3" "Locations 2 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/621.jpg" +"622" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 2" "Locations 1 and 4" "Locations 1 and 3" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/622.jpg" +"623" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 3" "Locations 1 and 2" "Locations 2 and 4" "Locations 1 and 4" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/623.jpg" +"624" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 2 and 4" "Locations 2 and 3" "Locations 1 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/624.jpg" +"625" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 3" "Locations 1 and 2" "Locations 2 and 3" "Locations 2 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/625.jpg" +"626" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 3" "Locations 1 and 2" "Locations 2 and 4" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/626.jpg" +"627" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 2 and 3" "Locations 1 and 3" "Locations 1 and 2" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/627.jpg" +"628" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 3" "Locations 2 and 4" "Locations 1 and 2" "Locations 2 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/628.jpg" +"629" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 2" "Locations 1 and 3" "Locations 2 and 4" "Locations 2 and 3" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/629.jpg" +"630" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 2" "Locations 1 and 3" "Locations 2 and 4" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/630.jpg" +"631" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 2" "Locations 2 and 3" "Locations 1 and 3" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/631.jpg" +"632" "A" "On the provided map, which two numbered locations belong to the same country?" "Locations 1 and 3" "Locations 2 and 4" "Locations 1 and 4" "Locations 2 and 3" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/632.jpg" +"633" "B" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 4" "Locations 1 and 3" "Locations 2 and 3" "Locations 1 and 4" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/633.jpg" +"634" "C" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 4" "Locations 1 and 3" "Locations 2 and 4" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/634.jpg" +"635" "D" "On the provided map, which two numbered locations belong to the same country?" "Locations 2 and 3" "Locations 1 and 4" "Locations 2 and 4" "Locations 1 and 3" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/635.jpg" +"636" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Abraham Lincoln" "Theodore Roosevelt" "Thomas Jefferson" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/636.jpg" +"637" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "George Washington" "Theodore Roosevelt" "Abraham Lincoln" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/637.jpg" +"638" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "George Washington" "Theodore Roosevelt" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/638.jpg" +"639" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Abraham Lincoln" "Thomas Jefferson" "Theodore Roosevelt" "George Washington" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/639.jpg" +"640" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "George Washington" "Theodore Roosevelt" "Abraham Lincoln" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/640.jpg" +"641" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Abraham Lincoln" "Thomas Jefferson" "Theodore Roosevelt" "George Washington" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/641.jpg" +"642" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Abraham Lincoln" "Thomas Jefferson" "Theodore Roosevelt" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/642.jpg" +"643" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "George Washington" "Abraham Lincoln" "Thomas Jefferson" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/643.jpg" +"644" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "Thomas Jefferson" "George Washington" "Abraham Lincoln" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/644.jpg" +"645" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Theodore Roosevelt" "George Washington" "Abraham Lincoln" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/645.jpg" +"646" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "Theodore Roosevelt" "George Washington" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/646.jpg" +"647" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Thomas Jefferson" "Abraham Lincoln" "Theodore Roosevelt" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/647.jpg" +"648" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Abraham Lincoln" "George Washington" "Thomas Jefferson" "Theodore Roosevelt" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/648.jpg" +"649" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "George Washington" "Theodore Roosevelt" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/649.jpg" +"650" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "George Washington" "Abraham Lincoln" "Thomas Jefferson" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/650.jpg" +"651" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "George Washington" "Theodore Roosevelt" "Abraham Lincoln" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/651.jpg" +"652" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Thomas Jefferson" "Theodore Roosevelt" "Abraham Lincoln" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/652.jpg" +"653" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "George Washington" "Thomas Jefferson" "Abraham Lincoln" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/653.jpg" +"654" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "George Washington" "Theodore Roosevelt" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/654.jpg" +"655" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "Abraham Lincoln" "Thomas Jefferson" "George Washington" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/655.jpg" +"656" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Theodore Roosevelt" "Abraham Lincoln" "George Washington" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/656.jpg" +"657" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Thomas Jefferson" "Abraham Lincoln" "Theodore Roosevelt" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/657.jpg" +"658" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "Abraham Lincoln" "Thomas Jefferson" "George Washington" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/658.jpg" +"659" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "Abraham Lincoln" "George Washington" "Thomas Jefferson" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/659.jpg" +"660" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Theodore Roosevelt" "Abraham Lincoln" "George Washington" "Thomas Jefferson" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/660.jpg" +"661" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Abraham Lincoln" "Theodore Roosevelt" "Thomas Jefferson" "George Washington" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/661.jpg" +"662" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "Theodore Roosevelt" "George Washington" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/662.jpg" +"663" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "George Washington" "Theodore Roosevelt" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/663.jpg" +"664" "A" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Abraham Lincoln" "Thomas Jefferson" "Theodore Roosevelt" "George Washington" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/664.jpg" +"665" "B" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "Thomas Jefferson" "Abraham Lincoln" "George Washington" "Theodore Roosevelt" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/665.jpg" +"666" "C" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Theodore Roosevelt" "Abraham Lincoln" "Thomas Jefferson" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/666.jpg" +"667" "D" "Which president's face is highlighted in the red rectangle on Mount Rushmore?" "George Washington" "Thomas Jefferson" "Theodore Roosevelt" "Abraham Lincoln" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/667.jpg" +"668" "A" "What is the sum of the sales for Item 1 and Item 6?" "97" "96" "94" "95" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/668.jpg" +"669" "B" "What is the sum of the sales for Item 1 and Item 6?" "95" "97" "96" "94" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/669.jpg" +"670" "C" "What is the sum of the sales for Item 1 and Item 6?" "94" "96" "97" "95" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/670.jpg" +"671" "D" "What is the sum of the sales for Item 1 and Item 6?" "96" "95" "94" "97" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/671.jpg" +"672" "A" "What is the average sales of Item 10 and Item 15?" "6" "15" "9" "12" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/672.jpg" +"673" "B" "What is the average sales of Item 10 and Item 15?" "9" "6" "15" "12" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/673.jpg" +"674" "C" "What is the average sales of Item 10 and Item 15?" "9" "12" "6" "15" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/674.jpg" +"675" "D" "What is the average sales of Item 10 and Item 15?" "12" "15" "9" "6" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/675.jpg" +"676" "A" "What is the sum of the sales for Item 1 and Item 6?" "97" "94" "95" "96" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/676.jpg" +"677" "B" "What is the sum of the sales for Item 1 and Item 6?" "95" "97" "96" "94" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/677.jpg" +"678" "C" "What is the sum of the sales for Item 1 and Item 6?" "96" "94" "97" "95" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/678.jpg" +"679" "D" "What is the sum of the sales for Item 1 and Item 6?" "95" "96" "94" "97" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/679.jpg" +"680" "A" "What is the average sales of Item 10 and Item 15?" "6" "12" "15" "9" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/680.jpg" +"681" "B" "What is the average sales of Item 10 and Item 15?" "9" "6" "12" "15" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/681.jpg" +"682" "C" "What is the average sales of Item 10 and Item 15?" "15" "12" "6" "9" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/682.jpg" +"683" "D" "What is the average sales of Item 10 and Item 15?" "15" "12" "9" "6" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/683.jpg" +"684" "A" "What is the sum of the sales for Item 1 and Item 6?" "97" "95" "94" "96" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/684.jpg" +"685" "B" "What is the sum of the sales for Item 1 and Item 6?" "96" "97" "94" "95" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/685.jpg" +"686" "C" "What is the sum of the sales for Item 1 and Item 6?" "94" "96" "97" "95" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/686.jpg" +"687" "D" "What is the sum of the sales for Item 1 and Item 6?" "96" "95" "94" "97" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/687.jpg" +"688" "A" "What is the average sales of Item 10 and Item 15?" "6" "12" "9" "15" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/688.jpg" +"689" "B" "What is the average sales of Item 10 and Item 15?" "15" "6" "12" "9" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/689.jpg" +"690" "C" "What is the average sales of Item 10 and Item 15?" "12" "15" "6" "9" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/690.jpg" +"691" "D" "What is the average sales of Item 10 and Item 15?" "15" "9" "12" "6" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/691.jpg" +"692" "A" "What is the sum of the sales for Item 1 and Item 6?" "97" "94" "95" "96" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/692.jpg" +"693" "B" "What is the sum of the sales for Item 1 and Item 6?" "95" "97" "94" "96" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/693.jpg" +"694" "C" "What is the sum of the sales for Item 1 and Item 6?" "95" "94" "97" "96" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/694.jpg" +"695" "D" "What is the sum of the sales for Item 1 and Item 6?" "96" "94" "95" "97" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/695.jpg" +"696" "A" "What is the average sales of Item 10 and Item 15?" "6" "15" "9" "12" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/696.jpg" +"697" "B" "What is the average sales of Item 10 and Item 15?" "9" "6" "12" "15" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/697.jpg" +"698" "C" "What is the average sales of Item 10 and Item 15?" "12" "15" "6" "9" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/698.jpg" +"699" "D" "What is the average sales of Item 10 and Item 15?" "15" "9" "12" "6" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/699.jpg" +"700" "A" "What is the sum of the sales for Item 1 and Item 6?" "97" "96" "95" "94" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/700.jpg" +"701" "B" "What is the sum of the sales for Item 1 and Item 6?" "96" "97" "94" "95" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/701.jpg" +"702" "C" "What is the sum of the sales for Item 1 and Item 6?" "96" "94" "97" "95" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/702.jpg" +"703" "D" "What is the sum of the sales for Item 1 and Item 6?" "96" "94" "95" "97" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/703.jpg" +"704" "A" "What is the average sales of Item 10 and Item 15?" "6" "9" "15" "12" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/704.jpg" +"705" "B" "What is the average sales of Item 10 and Item 15?" "9" "6" "15" "12" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/705.jpg" +"706" "C" "What is the average sales of Item 10 and Item 15?" "15" "9" "6" "12" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/706.jpg" +"707" "D" "What is the average sales of Item 10 and Item 15?" "9" "15" "12" "6" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/707.jpg" +"708" "A" "What is the color of the flag?" "white" "red" "blue" "green" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/708.jpg" +"709" "B" "What is the color of the flag?" "blue" "white" "red" "green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/709.jpg" +"710" "C" "What is the color of the flag?" "blue" "red" "white" "green" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/710.jpg" +"711" "D" "What is the color of the flag?" "red" "green" "blue" "white" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/711.jpg" +"712" "A" "What is the color of the car?" "red" "white" "blue" "green" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/712.jpg" +"713" "B" "What is the color of the car?" "white" "red" "blue" "green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/713.jpg" +"714" "C" "What is the color of the car?" "green" "blue" "red" "white" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/714.jpg" +"715" "D" "What is the color of the car?" "blue" "white" "green" "red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/715.jpg" +"716" "A" "What is the color of the house?" "white" "red" "green" "blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/716.jpg" +"717" "B" "What is the color of the house?" "blue" "white" "green" "red" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/717.jpg" +"718" "C" "What is the color of the house?" "red" "green" "white" "blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/718.jpg" +"719" "D" "What is the color of the house?" "blue" "red" "green" "white" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/719.jpg" +"720" "A" "How many people are there in the boat?" "Four" "One" "Three" "Two" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/720.jpg" +"721" "B" "How many people are there in the boat?" "Three" "Four" "Two" "One" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/721.jpg" +"722" "C" "How many people are there in the boat?" "Two" "Three" "Four" "One" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/722.jpg" +"723" "D" "How many people are there in the boat?" "Three" "One" "Two" "Four" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/723.jpg" +"724" "A" "What's the color of the car?" "Red" "White" "Green" "Blue" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/724.jpg" +"725" "B" "What's the color of the car?" "White" "Red" "Blue" "Green" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/725.jpg" +"726" "C" "What's the color of the car?" "Green" "White" "Red" "Blue" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/726.jpg" +"727" "D" "What's the color of the car?" "Green" "White" "Blue" "Red" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/727.jpg" +"728" "A" "What piece of equipment is prominently visible in the person's possession?" "A golf bag with golf clubs" "A fishing rod" "A baseball bat" "A tennis racket" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/728.jpg" +"729" "B" "What piece of equipment is prominently visible in the person's possession?" "A tennis racket" "A golf bag with golf clubs" "A baseball bat" "A fishing rod" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/729.jpg" +"730" "C" "What piece of equipment is prominently visible in the person's possession?" "A tennis racket" "A baseball bat" "A golf bag with golf clubs" "A fishing rod" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/730.jpg" +"731" "D" "What piece of equipment is prominently visible in the person's possession?" "A fishing rod" "A tennis racket" "A baseball bat" "A golf bag with golf clubs" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/731.jpg" +"732" "A" "Which country's flag is on the left?" "Germany" "United Kingdom" "American" "Japan" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/732.jpg" +"733" "B" "Which country's flag is on the left?" "American" "Germany" "United Kingdom" "Japan" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/733.jpg" +"734" "C" "Which country's flag is on the left?" "Japan" "American" "Germany" "United Kingdom" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/734.jpg" +"735" "D" "Which country's flag is on the left?" "United Kingdom" "American" "Japan" "Germany" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/735.jpg" +"736" "A" "The flag on the right in the image represents which German federal state?" "Bavaria" "Baden-Württemberg" "Saxony" "Hesse" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/736.jpg" +"737" "B" "The flag on the right in the image represents which German federal state?" "Baden-Württemberg" "Bavaria" "Hesse" "Saxony" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/737.jpg" +"738" "C" "The flag on the right in the image represents which German federal state?" "Baden-Württemberg" "Saxony" "Bavaria" "Hesse" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/738.jpg" +"739" "D" "The flag on the right in the image represents which German federal state?" "Baden-Württemberg" "Hesse" "Saxony" "Bavaria" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/739.jpg" +"740" "A" "Which country's naval ship is depicted in the image based on the flag shown?" "Netherlands" "France" "Germany" "Belgium" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/740.jpg" +"741" "B" "Which country's naval ship is depicted in the image based on the flag shown?" "Belgium" "Netherlands" "France" "Germany" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/741.jpg" +"742" "C" "Which country's naval ship is depicted in the image based on the flag shown?" "Germany" "Belgium" "Netherlands" "France" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/742.jpg" +"743" "D" "Which country's naval ship is depicted in the image based on the flag shown?" "Germany" "Belgium" "France" "Netherlands" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/743.jpg" +"744" "A" "In which country is this license plate registered?" "Iceland" "Norway" "Sweden" "China" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/744.jpg" +"745" "B" "In which country is this license plate registered?" "Norway" "Iceland" "Sweden" "China" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/745.jpg" +"746" "C" "In which country is this license plate registered?" "Norway" "China" "Iceland" "Sweden" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/746.jpg" +"747" "D" "In which country is this license plate registered?" "Sweden" "China" "Norway" "Iceland" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/747.jpg" +"748" "A" "Who is the founder of the company that makes the square white adapter shown in the image?" "Steve Jobs" "Bill Gates" "Jeff Bezos" "Wenbin Wang" "single" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/748.jpg" +"749" "B" "Who is the founder of the company that makes the square white adapter shown in the image?" "Bill Gates" "Steve Jobs" "Wenbin Wang" "Jeff Bezos" "single" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/749.jpg" +"750" "C" "Who is the founder of the company that makes the square white adapter shown in the image?" "Bill Gates" "Jeff Bezos" "Steve Jobs" "Wenbin Wang" "single" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/750.jpg" +"751" "D" "Who is the founder of the company that makes the square white adapter shown in the image?" "Wenbin Wang" "Bill Gates" "Jeff Bezos" "Steve Jobs" "single" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/751.jpg" +"752" "A" "What is the position of the blue backpack relative to the airplane?" "Below and to the left of the airplane" "Below and to the right of the airplane" "Upon and to the left of the airplane" "Upon and to the right of the airplane" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/752.jpg" +"753" "B" "What is the position of the blue backpack relative to the airplane?" "Upon and to the right of the airplane" "Below and to the left of the airplane" "Upon and to the left of the airplane" "Below and to the right of the airplane" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/753.jpg" +"754" "C" "What is the position of the blue backpack relative to the airplane?" "Below and to the right of the airplane" "Upon and to the right of the airplane" "Below and to the left of the airplane" "Upon and to the left of the airplane" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/754.jpg" +"755" "D" "What is the position of the blue backpack relative to the airplane?" "Upon and to the left of the airplane" "Upon and to the right of the airplane" "Below and to the right of the airplane" "Below and to the left of the airplane" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/755.jpg" +"756" "A" "What is the position of the blue backpack relative to the umbrella?" "Below and to the right of the umbrella" "Below and to the left of the umbrella" "Upon and to the left of the umbrella" "Upon and to the right of the umbrella" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/756.jpg" +"757" "B" "What is the position of the blue backpack relative to the umbrella?" "Below and to the left of the umbrella" "Below and to the right of the umbrella" "Upon and to the left of the umbrella" "Upon and to the right of the umbrella" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/757.jpg" +"758" "C" "What is the position of the blue backpack relative to the umbrella?" "Upon and to the left of the umbrella" "Upon and to the right of the umbrella" "Below and to the right of the umbrella" "Below and to the left of the umbrella" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/758.jpg" +"759" "D" "What is the position of the blue backpack relative to the umbrella?" "Upon and to the left of the umbrella" "Upon and to the right of the umbrella" "Below and to the left of the umbrella" "Below and to the right of the umbrella" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/759.jpg" +"760" "A" "What is the position of the blue backpack relative to the wooden box?" "On top of the wooden box" "Below the wooden box" "To the right of the wooden box" "To the left of the wooden box" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/760.jpg" +"761" "B" "What is the position of the blue backpack relative to the wooden box?" "Below the wooden box" "On top of the wooden box" "To the left of the wooden box" "To the right of the wooden box" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/761.jpg" +"762" "C" "What is the position of the blue backpack relative to the wooden box?" "To the left of the wooden box" "To the right of the wooden box" "On top of the wooden box" "Below the wooden box" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/762.jpg" +"763" "D" "What is the position of the blue backpack relative to the wooden box?" "Below the wooden box" "To the right of the wooden box" "To the left of the wooden box" "On top of the wooden box" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/763.jpg" +"764" "A" "What is the position of the wooden jewelry box relative to the clock?" "To the left of the clock" "To the right of the clock" "Over the clock" "Below the clock" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/764.jpg" +"765" "B" "What is the position of the wooden jewelry box relative to the clock?" "To the right of the clock" "To the left of the clock" "Below the clock" "Over the clock" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/765.jpg" +"766" "C" "What is the position of the wooden jewelry box relative to the clock?" "To the right of the clock" "Below the clock" "To the left of the clock" "Over the clock" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/766.jpg" +"767" "D" "What is the position of the wooden jewelry box relative to the clock?" "To the right of the clock" "Below the clock" "Over the clock" "To the left of the clock" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/767.jpg" +"768" "A" "How many chairs are there in the image?" "Two" "One" "Three" "Four" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/768.jpg" +"769" "B" "How many chairs are there in the image?" "One" "Two" "Four" "Three" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/769.jpg" +"770" "C" "How many chairs are there in the image?" "One" "Four" "Two" "Three" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/770.jpg" +"771" "D" "How many chairs are there in the image?" "Three" "One" "Four" "Two" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/771.jpg" +"772" "A" "What direction are the chairs facing in the image?" "The chairs are facing each other" "The chairs are facing towards the staircase" "The chairs are facing the window" "The chairs are facing away from each other" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/772.jpg" +"773" "B" "What direction are the chairs facing in the image?" "The chairs are facing the window" "The chairs are facing each other" "The chairs are facing towards the staircase" "The chairs are facing away from each other" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/773.jpg" +"774" "C" "What direction are the chairs facing in the image?" "The chairs are facing the window" "The chairs are facing towards the staircase" "The chairs are facing each other" "The chairs are facing away from each other" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/774.jpg" +"775" "D" "What direction are the chairs facing in the image?" "The chairs are facing the window" "The chairs are facing away from each other" "The chairs are facing towards the staircase" "The chairs are facing each other" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/775.jpg" +"776" "A" "What is the position of the blue backpack relative to the warning sign?" "To the left of the warning sign" "Below the warning sign" "To the right of the warning sign" "On top of the warning sign" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/776.jpg" +"777" "B" "What is the position of the blue backpack relative to the warning sign?" "To the right of the warning sign" "To the left of the warning sign" "Below the warning sign" "On top of the warning sign" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/777.jpg" +"778" "C" "What is the position of the blue backpack relative to the warning sign?" "Below the warning sign" "To the right of the warning sign" "To the left of the warning sign" "On top of the warning sign" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/778.jpg" +"779" "D" "What is the position of the blue backpack relative to the warning sign?" "Below the warning sign" "To the right of the warning sign" "On top of the warning sign" "To the left of the warning sign" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/779.jpg" +"780" "A" "What is the position of the black car relative to the tram?" "Behind the tram" "In front of the tram" "To the right of the tram" "To the left of the tram" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/780.jpg" +"781" "B" "What is the position of the black car relative to the tram?" "To the left of the tram" "Behind the tram" "In front of the tram" "To the right of the tram" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/781.jpg" +"782" "C" "What is the position of the black car relative to the tram?" "To the left of the tram" "In front of the tram" "Behind the tram" "To the right of the tram" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/782.jpg" +"783" "D" "What is the position of the black car relative to the tram?" "To the left of the tram" "In front of the tram" "To the right of the tram" "Behind the tram" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/783.jpg" +"784" "A" "How many people are there in the image?" "Four" "Two" "Three" "One" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/784.jpg" +"785" "B" "How many people are there in the image?" "Three" "Four" "Two" "One" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/785.jpg" +"786" "C" "How many people are there in the image?" "Three" "One" "Four" "Two" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/786.jpg" +"787" "D" "How many people are there in the image?" "Two" "One" "Three" "Four" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/787.jpg" +"788" "A" "How many people are there in the image?" "Five" "Four" "Two" "Three" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/788.jpg" +"789" "B" "How many people are there in the image?" "Two" "Five" "Four" "Three" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/789.jpg" +"790" "C" "How many people are there in the image?" "Two" "Four" "Five" "Three" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/790.jpg" +"791" "D" "How many people are there in the image?" "Four" "Two" "Three" "Five" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/791.jpg" +"792" "A" "How many people are there in the image?" "Two" "Three" "One" "Four" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/792.jpg" +"793" "B" "How many people are there in the image?" "One" "Two" "Four" "Three" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/793.jpg" +"794" "C" "How many people are there in the image?" "Three" "Four" "Two" "One" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/794.jpg" +"795" "D" "How many people are there in the image?" "One" "Three" "Four" "Two" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/795.jpg" +"796" "A" "What is the position of the boat relative to the buildings?" "To the left of the buildings" "To the right of the buildings" "Below the buildings" "On the top of the buildings" "cross" "0" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/796.jpg" +"797" "B" "What is the position of the boat relative to the buildings?" "Below the buildings" "To the left of the buildings" "On the top of the buildings" "To the right of the buildings" "cross" "1" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/797.jpg" +"798" "C" "What is the position of the boat relative to the buildings?" "On the top of the buildings" "To the right of the buildings" "To the left of the buildings" "Below the buildings" "cross" "2" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/798.jpg" +"799" "D" "What is the position of the boat relative to the buildings?" "On the top of the buildings" "Below the buildings" "To the right of the buildings" "To the left of the buildings" "cross" "3" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/HRBench4K/799.jpg"