diff --git "a/ /AMBER_local.tsv" "b/ /AMBER_local.tsv" new file mode 100644--- /dev/null +++ "b/ /AMBER_local.tsv" @@ -0,0 +1,14217 @@ +"index" "question" "answer" "category" "image_path" +"1005" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1005.jpg" +"1006" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1006.jpg" +"1007" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1007.jpg" +"1008" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1008.jpg" +"1009" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1009.jpg" +"1010" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1010.jpg" +"1011" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1011.jpg" +"1012" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1012.jpg" +"1013" "Are there three people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1013.jpg" +"1014" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1014.jpg" +"1015" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1015.jpg" +"1016" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1016.jpg" +"1017" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1017.jpg" +"1018" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1018.jpg" +"1019" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1019.jpg" +"1020" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1020.jpg" +"1021" "Is the ship white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1021.jpg" +"1022" "Is the ship black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1022.jpg" +"1023" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1023.jpg" +"1024" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1024.jpg" +"1025" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1025.jpg" +"1026" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1026.jpg" +"1027" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1027.jpg" +"1028" "Is the cloud blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1028.jpg" +"1029" "Is the lake calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1029.jpg" +"1030" "Is the lake turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1030.jpg" +"1031" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1031.jpg" +"1032" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1032.jpg" +"1033" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1033.jpg" +"1034" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1034.jpg" +"1035" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1035.jpg" +"1036" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1036.jpg" +"1037" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1037.jpg" +"1038" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1038.jpg" +"1039" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1039.jpg" +"1040" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1040.jpg" +"1041" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1041.jpg" +"1042" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1042.jpg" +"1043" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1043.jpg" +"1044" "Is the lake stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1044.jpg" +"1045" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1045.jpg" +"1046" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1046.jpg" +"1047" "Is there one paddle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1047.jpg" +"1048" "Are there two paddles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1048.jpg" +"1049" "Is the watch black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1049.jpg" +"1050" "Is the watch white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1050.jpg" +"1051" "Does the person jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1051.jpg" +"1052" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1052.jpg" +"1053" "Is the sea turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1053.jpg" +"1054" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1054.jpg" +"1055" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1055.jpg" +"1056" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1056.jpg" +"1057" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1057.jpg" +"1058" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1058.jpg" +"1059" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1059.jpg" +"1060" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1060.jpg" +"1061" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1061.jpg" +"1062" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1062.jpg" +"1063" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1063.jpg" +"1064" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1064.jpg" +"1065" "Is the guardrail short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1065.jpg" +"1066" "Is the guardrail tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1066.jpg" +"1067" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1067.jpg" +"1068" "Is the tree red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1068.jpg" +"1069" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1069.jpg" +"1070" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1070.jpg" +"1071" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1071.jpg" +"1072" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1072.jpg" +"1073" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1073.jpg" +"1074" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1074.jpg" +"1075" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1075.jpg" +"1076" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1076.jpg" +"1077" "Is there one bucket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1077.jpg" +"1078" "Are there two buckets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1078.jpg" +"1079" "Is there one shovel in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1079.jpg" +"1080" "Are there two shovels in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1080.jpg" +"1081" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1081.jpg" +"1082" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1082.jpg" +"1083" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1083.jpg" +"1084" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1084.jpg" +"1085" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1085.jpg" +"1086" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1086.jpg" +"1087" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1087.jpg" +"1088" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1088.jpg" +"1089" "Is there one duck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1089.jpg" +"1090" "Are there two ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1090.jpg" +"1091" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1091.jpg" +"1092" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1092.jpg" +"1093" "Is the hat red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1093.jpg" +"1094" "Is the hat white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1094.jpg" +"1095" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1095.jpg" +"1096" "Are there three footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1096.jpg" +"1097" "Are there two men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1097.jpg" +"1098" "Are there five men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1098.jpg" +"1099" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1099.jpg" +"1100" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1100.jpg" +"1101" "Are there four balls in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1101.jpg" +"1102" "Are there six balls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1102.jpg" +"1103" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1103.jpg" +"1104" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1104.jpg" +"1105" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1105.jpg" +"1106" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1106.jpg" +"1107" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1107.jpg" +"1108" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1108.jpg" +"1109" "Is there one tie in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1109.jpg" +"1110" "Are there two ties in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1110.jpg" +"1111" "Are there three dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1111.jpg" +"1112" "Are there four dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1112.jpg" +"1113" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1113.jpg" +"1114" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1114.jpg" +"1115" "Does the person lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1115.jpg" +"1116" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1116.jpg" +"1117" "Is the grass yellowed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1117.jpg" +"1118" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1118.jpg" +"1119" "Is there one rugby in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1119.jpg" +"1120" "Are there two rugbies in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1120.jpg" +"1121" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1121.jpg" +"1122" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1122.jpg" +"1123" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1123.jpg" +"1124" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1124.jpg" +"1125" "Does the woman laugh in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1125.jpg" +"1126" "Does the woman cry in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1126.jpg" +"1127" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1127.jpg" +"1128" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1128.jpg" +"1129" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1129.jpg" +"1130" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1130.jpg" +"1131" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1131.jpg" +"1132" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1132.jpg" +"1133" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1133.jpg" +"1134" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1134.jpg" +"1135" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1135.jpg" +"1136" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1136.jpg" +"1137" "Is the desert dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1137.jpg" +"1138" "Is the desert wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1138.jpg" +"1139" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1139.jpg" +"1140" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1140.jpg" +"1141" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1141.jpg" +"1142" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1142.jpg" +"1143" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1143.jpg" +"1144" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1144.jpg" +"1145" "Is the hat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1145.jpg" +"1146" "Is the hat blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1146.jpg" +"1147" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1147.jpg" +"1148" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1148.jpg" +"1149" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1149.jpg" +"1150" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1150.jpg" +"1151" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1151.jpg" +"1152" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1152.jpg" +"1153" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1153.jpg" +"1154" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1154.jpg" +"1155" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1155.jpg" +"1156" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1156.jpg" +"1157" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1157.jpg" +"1158" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1158.jpg" +"1159" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1159.jpg" +"1160" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1160.jpg" +"1161" "Is the person surf in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1161.jpg" +"1162" "Is the person swim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1162.jpg" +"1163" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1163.jpg" +"1164" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1164.jpg" +"1165" "Is the sea turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1165.jpg" +"1166" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1166.jpg" +"1167" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1167.jpg" +"1168" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1168.jpg" +"1169" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1169.jpg" +"1170" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1170.jpg" +"1171" "Are there three men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1171.jpg" +"1172" "Are there four men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1172.jpg" +"1173" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1173.jpg" +"1174" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1174.jpg" +"1175" "Is the sky yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1175.jpg" +"1176" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1176.jpg" +"1177" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1177.jpg" +"1178" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1178.jpg" +"1179" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1179.jpg" +"1180" "Is the lake calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1180.jpg" +"1181" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1181.jpg" +"1182" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1182.jpg" +"1183" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1183.jpg" +"1184" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1184.jpg" +"1185" "Are there four women in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1185.jpg" +"1186" "Are there five women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1186.jpg" +"1187" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1187.jpg" +"1188" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1188.jpg" +"1189" "Are there two dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1189.jpg" +"1190" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1190.jpg" +"1191" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1191.jpg" +"1192" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1192.jpg" +"1193" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1193.jpg" +"1194" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1194.jpg" +"1195" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1195.jpg" +"1196" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1196.jpg" +"1197" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1197.jpg" +"1198" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1198.jpg" +"1199" "Does the woman run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1199.jpg" +"1200" "Does the woman walk in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1200.jpg" +"1201" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1201.jpg" +"1202" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1202.jpg" +"1203" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1203.jpg" +"1204" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1204.jpg" +"1205" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1205.jpg" +"1206" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1206.jpg" +"1207" "Is the ball white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1207.jpg" +"1208" "Is the ball black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1208.jpg" +"1209" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1209.jpg" +"1210" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1210.jpg" +"1211" "Is the sign square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1211.jpg" +"1212" "Is the sign round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1212.jpg" +"1213" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1213.jpg" +"1214" "Does the man run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1214.jpg" +"1215" "Is the tree emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1215.jpg" +"1216" "Is the tree yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1216.jpg" +"1217" "Is the fence white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1217.jpg" +"1218" "Is the fence yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1218.jpg" +"1219" "Is the car black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1219.jpg" +"1220" "Is the car white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1220.jpg" +"1221" "Is the lake turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1221.jpg" +"1222" "Is the lake calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1222.jpg" +"1223" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1223.jpg" +"1224" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1224.jpg" +"1225" "Is the ground uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1225.jpg" +"1226" "Is the ground smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1226.jpg" +"1227" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1227.jpg" +"1228" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1228.jpg" +"1229" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1229.jpg" +"1230" "Does the child run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1230.jpg" +"1231" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1231.jpg" +"1232" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1232.jpg" +"1233" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1233.jpg" +"1234" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1234.jpg" +"1235" "Is the ground smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1235.jpg" +"1236" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1236.jpg" +"1237" "Is the motorbike starting in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1237.jpg" +"1238" "Is the motorbike closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1238.jpg" +"1239" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1239.jpg" +"1240" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1240.jpg" +"1241" "Is the hat red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1241.jpg" +"1242" "Is the hat black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1242.jpg" +"1243" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1243.jpg" +"1244" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1244.jpg" +"1245" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1245.jpg" +"1246" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1246.jpg" +"1247" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1247.jpg" +"1248" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1248.jpg" +"1249" "Is the ground smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1249.jpg" +"1250" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1250.jpg" +"1251" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1251.jpg" +"1252" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1252.jpg" +"1253" "Is the ground smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1253.jpg" +"1254" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1254.jpg" +"1255" "Is the motorbike starting in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1255.jpg" +"1256" "Is the motorbike closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1256.jpg" +"1257" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1257.jpg" +"1258" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1258.jpg" +"1259" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1259.jpg" +"1260" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1260.jpg" +"1261" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1261.jpg" +"1262" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1262.jpg" +"1263" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1263.jpg" +"1264" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1264.jpg" +"1265" "Does the child run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1265.jpg" +"1266" "Does the child walk in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1266.jpg" +"1267" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1267.jpg" +"1268" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1268.jpg" +"1269" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1269.jpg" +"1270" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1270.jpg" +"1271" "Is the child run in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1271.jpg" +"1272" "Is the child sit in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1272.jpg" +"1273" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1273.jpg" +"1274" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1274.jpg" +"1275" "Is the sea rolling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1275.jpg" +"1276" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1276.jpg" +"1277" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1277.jpg" +"1278" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1278.jpg" +"1279" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1279.jpg" +"1280" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1280.jpg" +"1281" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1281.jpg" +"1282" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1282.jpg" +"1283" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1283.jpg" +"1284" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1284.jpg" +"1285" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1285.jpg" +"1286" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1286.jpg" +"1287" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1287.jpg" +"1288" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1288.jpg" +"1289" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1289.jpg" +"1290" "Does the person dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1290.jpg" +"1291" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1291.jpg" +"1292" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1292.jpg" +"1293" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1293.jpg" +"1294" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1294.jpg" +"1295" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1295.jpg" +"1296" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1296.jpg" +"1297" "Does the person play soccer in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1297.jpg" +"1298" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1298.jpg" +"1299" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1299.jpg" +"1300" "Are there three glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1300.jpg" +"1301" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1301.jpg" +"1302" "Is the grass on the brink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1302.jpg" +"1303" "Is the sky vast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1303.jpg" +"1304" "Is the sky jet-black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1304.jpg" +"1305" "Is the cloud colorful in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1305.jpg" +"1306" "Is the cloud cloudy skies in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1306.jpg" +"1307" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1307.jpg" +"1308" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1308.jpg" +"1309" "Is the sea purple in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1309.jpg" +"1310" "Is the sea blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1310.jpg" +"1311" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1311.jpg" +"1312" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1312.jpg" +"1313" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1313.jpg" +"1314" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1314.jpg" +"1315" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1315.jpg" +"1316" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1316.jpg" +"1317" "Is the forest yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1317.jpg" +"1318" "Is the forest blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1318.jpg" +"1319" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1319.jpg" +"1320" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1320.jpg" +"1321" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1321.jpg" +"1322" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1322.jpg" +"1323" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1323.jpg" +"1324" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1324.jpg" +"1325" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1325.jpg" +"1326" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1326.jpg" +"1327" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1327.jpg" +"1328" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1328.jpg" +"1329" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1329.jpg" +"1330" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1330.jpg" +"1331" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1331.jpg" +"1332" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1332.jpg" +"1333" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1333.jpg" +"1334" "Does the person dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1334.jpg" +"1335" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1335.jpg" +"1336" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1336.jpg" +"1337" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1337.jpg" +"1338" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1338.jpg" +"1339" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1339.jpg" +"1340" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1340.jpg" +"1341" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1341.jpg" +"1342" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1342.jpg" +"1343" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1343.jpg" +"1344" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1344.jpg" +"1345" "Is the flower vibrant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1345.jpg" +"1346" "Is the flower plain in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1346.jpg" +"1347" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1347.jpg" +"1348" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1348.jpg" +"1349" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1349.jpg" +"1350" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1350.jpg" +"1351" "Is the wall dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1351.jpg" +"1352" "Is the wall clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1352.jpg" +"1353" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1353.jpg" +"1354" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1354.jpg" +"1355" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1355.jpg" +"1356" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1356.jpg" +"1357" "Is the forest withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1357.jpg" +"1358" "Is the forest lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1358.jpg" +"1359" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1359.jpg" +"1360" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1360.jpg" +"1361" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1361.jpg" +"1362" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1362.jpg" +"1363" "Is there one house in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1363.jpg" +"1364" "Are there two houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1364.jpg" +"1365" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1365.jpg" +"1366" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1366.jpg" +"1367" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1367.jpg" +"1368" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1368.jpg" +"1369" "Are there two sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1369.jpg" +"1370" "Are there three sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1370.jpg" +"1371" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1371.jpg" +"1372" "Is the tree blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1372.jpg" +"1373" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1373.jpg" +"1374" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1374.jpg" +"1375" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1375.jpg" +"1376" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1376.jpg" +"1377" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1377.jpg" +"1378" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1378.jpg" +"1379" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1379.jpg" +"1380" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1380.jpg" +"1381" "Is the road clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1381.jpg" +"1382" "Is the road dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1382.jpg" +"1383" "Is the dog black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1383.jpg" +"1384" "Is the dog blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1384.jpg" +"1385" "Is the person run in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1385.jpg" +"1386" "Is the person jump in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1386.jpg" +"1387" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1387.jpg" +"1388" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1388.jpg" +"1389" "Is the floor tiled in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1389.jpg" +"1390" "Is the floor wooden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1390.jpg" +"1391" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1391.jpg" +"1392" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1392.jpg" +"1393" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1393.jpg" +"1394" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1394.jpg" +"1395" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1395.jpg" +"1396" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1396.jpg" +"1397" "Does the person crouch in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1397.jpg" +"1398" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1398.jpg" +"1399" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1399.jpg" +"1400" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1400.jpg" +"1401" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1401.jpg" +"1402" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1402.jpg" +"1403" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1403.jpg" +"1404" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1404.jpg" +"1405" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1405.jpg" +"1406" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1406.jpg" +"1407" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1407.jpg" +"1408" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1408.jpg" +"1409" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1409.jpg" +"1410" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1410.jpg" +"1411" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1411.jpg" +"1412" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1412.jpg" +"1413" "Does the person lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1413.jpg" +"1414" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1414.jpg" +"1415" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1415.jpg" +"1416" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1416.jpg" +"1417" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1417.jpg" +"1418" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1418.jpg" +"1419" "Is the fence short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1419.jpg" +"1420" "Is the fence tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1420.jpg" +"1421" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1421.jpg" +"1422" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1422.jpg" +"1423" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1423.jpg" +"1424" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1424.jpg" +"1425" "Is the hat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1425.jpg" +"1426" "Is the hat red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1426.jpg" +"1427" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1427.jpg" +"1428" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1428.jpg" +"1429" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1429.jpg" +"1430" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1430.jpg" +"1431" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1431.jpg" +"1432" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1432.jpg" +"1433" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1433.jpg" +"1434" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1434.jpg" +"1435" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1435.jpg" +"1436" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1436.jpg" +"1437" "Is the ball colorful in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1437.jpg" +"1438" "Is the ball monochromatic in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1438.jpg" +"1439" "Is there one child in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1439.jpg" +"1440" "Are there two children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1440.jpg" +"1441" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1441.jpg" +"1442" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1442.jpg" +"1443" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1443.jpg" +"1444" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1444.jpg" +"1445" "Does the man play the piano in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1445.jpg" +"1446" "Does the man perform in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1446.jpg" +"1447" "Is there one guitar in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1447.jpg" +"1448" "Are there two guitars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1448.jpg" +"1449" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1449.jpg" +"1450" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1450.jpg" +"1451" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1451.jpg" +"1452" "Does the dog walking in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1452.jpg" +"1453" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1453.jpg" +"1454" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1454.jpg" +"1455" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1455.jpg" +"1456" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1456.jpg" +"1457" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1457.jpg" +"1458" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1458.jpg" +"1459" "Does the child lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1459.jpg" +"1460" "Does the child run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1460.jpg" +"1461" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1461.jpg" +"1462" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1462.jpg" +"1463" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1463.jpg" +"1464" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1464.jpg" +"1465" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1465.jpg" +"1466" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1466.jpg" +"1467" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1467.jpg" +"1468" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1468.jpg" +"1469" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1469.jpg" +"1470" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1470.jpg" +"1471" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1471.jpg" +"1472" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1472.jpg" +"1473" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1473.jpg" +"1474" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1474.jpg" +"1475" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1475.jpg" +"1476" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1476.jpg" +"1477" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1477.jpg" +"1478" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1478.jpg" +"1479" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1479.jpg" +"1480" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1480.jpg" +"1481" "Is the flower fresh in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1481.jpg" +"1482" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1482.jpg" +"1483" "Is there one flowerpot in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1483.jpg" +"1484" "Are there two flowerpots in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1484.jpg" +"1485" "Is the ground tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1485.jpg" +"1486" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1486.jpg" +"1487" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1487.jpg" +"1488" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1488.jpg" +"1489" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1489.jpg" +"1490" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1490.jpg" +"1491" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1491.jpg" +"1492" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1492.jpg" +"1493" "Does the dog jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1493.jpg" +"1494" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1494.jpg" +"1495" "Is there one ball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1495.jpg" +"1496" "Are there two balls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1496.jpg" +"1497" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1497.jpg" +"1498" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1498.jpg" +"1499" "Is the book open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1499.jpg" +"1500" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1500.jpg" +"1501" "Is there one notebook in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1501.jpg" +"1502" "Are there two notebooks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1502.jpg" +"1503" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1503.jpg" +"1504" "Are there two pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1504.jpg" +"1505" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1505.jpg" +"1506" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1506.jpg" +"1507" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1507.jpg" +"1508" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1508.jpg" +"1509" "Is the ground muddy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1509.jpg" +"1510" "Is the ground flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1510.jpg" +"1511" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1511.jpg" +"1512" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1512.jpg" +"1513" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1513.jpg" +"1514" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1514.jpg" +"1515" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1515.jpg" +"1516" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1516.jpg" +"1517" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1517.jpg" +"1518" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1518.jpg" +"1519" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1519.jpg" +"1520" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1520.jpg" +"1521" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1521.jpg" +"1522" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1522.jpg" +"1523" "Are there two dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1523.jpg" +"1524" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1524.jpg" +"1525" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1525.jpg" +"1526" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1526.jpg" +"1527" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1527.jpg" +"1528" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1528.jpg" +"1529" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1529.jpg" +"1530" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1530.jpg" +"1531" "Is there one camera in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1531.jpg" +"1532" "Are there two cameras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1532.jpg" +"1533" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1533.jpg" +"1534" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1534.jpg" +"1535" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1535.jpg" +"1536" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1536.jpg" +"1537" "Are there three dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1537.jpg" +"1538" "Are there four dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1538.jpg" +"1539" "Is there one ball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1539.jpg" +"1540" "Are there two balls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1540.jpg" +"1541" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1541.jpg" +"1542" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1542.jpg" +"1543" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1543.jpg" +"1544" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1544.jpg" +"1545" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1545.jpg" +"1546" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1546.jpg" +"1547" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1547.jpg" +"1548" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1548.jpg" +"1549" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1549.jpg" +"1550" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1550.jpg" +"1551" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1551.jpg" +"1552" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1552.jpg" +"1553" "Does the person cycling in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1553.jpg" +"1554" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1554.jpg" +"1555" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1555.jpg" +"1556" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1556.jpg" +"1557" "Is the ground yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1557.jpg" +"1558" "Is the ground red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1558.jpg" +"1559" "Is the forest yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1559.jpg" +"1560" "Is the forest green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1560.jpg" +"1561" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1561.jpg" +"1562" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1562.jpg" +"1563" "Is the ground muddy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1563.jpg" +"1564" "Is the ground concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1564.jpg" +"1565" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1565.jpg" +"1566" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1566.jpg" +"1567" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1567.jpg" +"1568" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1568.jpg" +"1569" "Is the fence tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1569.jpg" +"1570" "Is the fence short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1570.jpg" +"1571" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1571.jpg" +"1572" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1572.jpg" +"1573" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1573.jpg" +"1574" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1574.jpg" +"1575" "Does the woman ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1575.jpg" +"1576" "Does the woman dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1576.jpg" +"1577" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1577.jpg" +"1578" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1578.jpg" +"1579" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1579.jpg" +"1580" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1580.jpg" +"1581" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1581.jpg" +"1582" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1582.jpg" +"1583" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1583.jpg" +"1584" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1584.jpg" +"1585" "Does the child climb a tree in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1585.jpg" +"1586" "Does the child ride a bike in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1586.jpg" +"1587" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1587.jpg" +"1588" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1588.jpg" +"1589" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1589.jpg" +"1590" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1590.jpg" +"1591" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1591.jpg" +"1592" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1592.jpg" +"1593" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1593.jpg" +"1594" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1594.jpg" +"1595" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1595.jpg" +"1596" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1596.jpg" +"1597" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1597.jpg" +"1598" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1598.jpg" +"1599" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1599.jpg" +"1600" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1600.jpg" +"1601" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1601.jpg" +"1602" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1602.jpg" +"1603" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1603.jpg" +"1604" "Is the forest blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1604.jpg" +"1605" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1605.jpg" +"1606" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1606.jpg" +"1607" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1607.jpg" +"1608" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1608.jpg" +"1609" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1609.jpg" +"1610" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1610.jpg" +"1611" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1611.jpg" +"1612" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1612.jpg" +"1613" "Is the hydrant red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1613.jpg" +"1614" "Is the hydrant white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1614.jpg" +"1615" "Are there two dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1615.jpg" +"1616" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1616.jpg" +"1617" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1617.jpg" +"1618" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1618.jpg" +"1619" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1619.jpg" +"1620" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1620.jpg" +"1621" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1621.jpg" +"1622" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1622.jpg" +"1623" "Is the river rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1623.jpg" +"1624" "Is the river rolling waves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1624.jpg" +"1625" "Does the person row a boat in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1625.jpg" +"1626" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1626.jpg" +"1627" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1627.jpg" +"1628" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1628.jpg" +"1629" "Is the paddle yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1629.jpg" +"1630" "Is the paddle black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1630.jpg" +"1631" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1631.jpg" +"1632" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1632.jpg" +"1633" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1633.jpg" +"1634" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1634.jpg" +"1635" "Does the child sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1635.jpg" +"1636" "Does the child stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1636.jpg" +"1637" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1637.jpg" +"1638" "Are there two toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1638.jpg" +"1639" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1639.jpg" +"1640" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1640.jpg" +"1641" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1641.jpg" +"1642" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1642.jpg" +"1643" "Are there three people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1643.jpg" +"1644" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1644.jpg" +"1645" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1645.jpg" +"1646" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1646.jpg" +"1647" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1647.jpg" +"1648" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1648.jpg" +"1649" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1649.jpg" +"1650" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1650.jpg" +"1651" "Are there two men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1651.jpg" +"1652" "Are there three men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1652.jpg" +"1653" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1653.jpg" +"1654" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1654.jpg" +"1655" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1655.jpg" +"1656" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1656.jpg" +"1657" "Is the forest withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1657.jpg" +"1658" "Is the forest lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1658.jpg" +"1659" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1659.jpg" +"1660" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1660.jpg" +"1661" "Are there two children in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1661.jpg" +"1662" "Are there three children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1662.jpg" +"1663" "Is the ground curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1663.jpg" +"1664" "Is the ground straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1664.jpg" +"1665" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1665.jpg" +"1666" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1666.jpg" +"1667" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1667.jpg" +"1668" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1668.jpg" +"1669" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1669.jpg" +"1670" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1670.jpg" +"1671" "Does the person play soccer in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1671.jpg" +"1672" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1672.jpg" +"1673" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1673.jpg" +"1674" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1674.jpg" +"1675" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1675.jpg" +"1676" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1676.jpg" +"1677" "Does the man surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1677.jpg" +"1678" "Does the man dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1678.jpg" +"1679" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1679.jpg" +"1680" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1680.jpg" +"1681" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1681.jpg" +"1682" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1682.jpg" +"1683" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1683.jpg" +"1684" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1684.jpg" +"1685" "Are there three people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1685.jpg" +"1686" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1686.jpg" +"1687" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1687.jpg" +"1688" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1688.jpg" +"1689" "Is there one shampoo in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1689.jpg" +"1690" "Are there two shampoos in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1690.jpg" +"1691" "Is there one child in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1691.jpg" +"1692" "Are there two children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1692.jpg" +"1693" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1693.jpg" +"1694" "Is the bath black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1694.jpg" +"1695" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1695.jpg" +"1696" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1696.jpg" +"1697" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1697.jpg" +"1698" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1698.jpg" +"1699" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1699.jpg" +"1700" "Is the bath black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1700.jpg" +"1701" "Does the man lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1701.jpg" +"1702" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1702.jpg" +"1703" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1703.jpg" +"1704" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1704.jpg" +"1705" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1705.jpg" +"1706" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1706.jpg" +"1707" "Is there one ball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1707.jpg" +"1708" "Are there two balls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1708.jpg" +"1709" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1709.jpg" +"1710" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1710.jpg" +"1711" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1711.jpg" +"1712" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1712.jpg" +"1713" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1713.jpg" +"1714" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1714.jpg" +"1715" "Does the person horseback riding in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1715.jpg" +"1716" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1716.jpg" +"1717" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1717.jpg" +"1718" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1718.jpg" +"1719" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1719.jpg" +"1720" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1720.jpg" +"1721" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1721.jpg" +"1722" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1722.jpg" +"1723" "Is the sky deep blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1723.jpg" +"1724" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1724.jpg" +"1725" "Is the telescope blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1725.jpg" +"1726" "Is the telescope black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1726.jpg" +"1727" "Is the ground gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1727.jpg" +"1728" "Is the ground yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1728.jpg" +"1729" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1729.jpg" +"1730" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1730.jpg" +"1731" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1731.jpg" +"1732" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1732.jpg" +"1733" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1733.jpg" +"1734" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1734.jpg" +"1735" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1735.jpg" +"1736" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1736.jpg" +"1737" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1737.jpg" +"1738" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1738.jpg" +"1739" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1739.jpg" +"1740" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1740.jpg" +"1741" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1741.jpg" +"1742" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1742.jpg" +"1743" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1743.jpg" +"1744" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1744.jpg" +"1745" "Is there one bottle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1745.jpg" +"1746" "Are there two bottles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1746.jpg" +"1747" "Does the snow white in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1747.jpg" +"1748" "Does the snow blue in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1748.jpg" +"1749" "Is there one backpack in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1749.jpg" +"1750" "Are there two backpacks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1750.jpg" +"1751" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1751.jpg" +"1752" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1752.jpg" +"1753" "Does the person lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1753.jpg" +"1754" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1754.jpg" +"1755" "Is there one camera in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1755.jpg" +"1756" "Are there two cameras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1756.jpg" +"1757" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1757.jpg" +"1758" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1758.jpg" +"1759" "Are there two motorbikes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1759.jpg" +"1760" "Are there four motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1760.jpg" +"1761" "Is the stair gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1761.jpg" +"1762" "Is the stair white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1762.jpg" +"1763" "Is the lake rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1763.jpg" +"1764" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1764.jpg" +"1765" "Does the dog swim in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1765.jpg" +"1766" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1766.jpg" +"1767" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1767.jpg" +"1768" "Are there two toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1768.jpg" +"1769" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1769.jpg" +"1770" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1770.jpg" +"1771" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1771.jpg" +"1772" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1772.jpg" +"1773" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1773.jpg" +"1774" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1774.jpg" +"1775" "Is the person surf in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1775.jpg" +"1776" "Is the person swim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1776.jpg" +"1777" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1777.jpg" +"1778" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1778.jpg" +"1779" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1779.jpg" +"1780" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1780.jpg" +"1781" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1781.jpg" +"1782" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1782.jpg" +"1783" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1783.jpg" +"1784" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1784.jpg" +"1785" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1785.jpg" +"1786" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1786.jpg" +"1787" "Is there one bus in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1787.jpg" +"1788" "Are there two buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1788.jpg" +"1789" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1789.jpg" +"1790" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1790.jpg" +"1791" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1791.jpg" +"1792" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1792.jpg" +"1793" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1793.jpg" +"1794" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1794.jpg" +"1795" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1795.jpg" +"1796" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1796.jpg" +"1797" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1797.jpg" +"1798" "Is the sun soft in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1798.jpg" +"1799" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1799.jpg" +"1800" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1800.jpg" +"1801" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1801.jpg" +"1802" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1802.jpg" +"1803" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1803.jpg" +"1804" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1804.jpg" +"1805" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1805.jpg" +"1806" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1806.jpg" +"1807" "Is the wall rough in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1807.jpg" +"1808" "Is the wall smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1808.jpg" +"1809" "Is the door blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1809.jpg" +"1810" "Is the door white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1810.jpg" +"1811" "Does the man lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1811.jpg" +"1812" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1812.jpg" +"1813" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1813.jpg" +"1814" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1814.jpg" +"1815" "Is there one cone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1815.jpg" +"1816" "Are there two cones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1816.jpg" +"1817" "Does the beach uneven in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1817.jpg" +"1818" "Does the beach flat in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1818.jpg" +"1819" "Does the man jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1819.jpg" +"1820" "Does the man run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1820.jpg" +"1821" "Is there one volleyball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1821.jpg" +"1822" "Are there two volleyballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1822.jpg" +"1823" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1823.jpg" +"1824" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1824.jpg" +"1825" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1825.jpg" +"1826" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1826.jpg" +"1827" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1827.jpg" +"1828" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1828.jpg" +"1829" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1829.jpg" +"1830" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1830.jpg" +"1831" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1831.jpg" +"1832" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1832.jpg" +"1833" "Does the woman ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1833.jpg" +"1834" "Does the woman swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1834.jpg" +"1835" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1835.jpg" +"1836" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1836.jpg" +"1837" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1837.jpg" +"1838" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1838.jpg" +"1839" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1839.jpg" +"1840" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1840.jpg" +"1841" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1841.jpg" +"1842" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1842.jpg" +"1843" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1843.jpg" +"1844" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1844.jpg" +"1845" "Does the woman run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1845.jpg" +"1846" "Does the woman dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1846.jpg" +"1847" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1847.jpg" +"1848" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1848.jpg" +"1849" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1849.jpg" +"1850" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1850.jpg" +"1851" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1851.jpg" +"1852" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1852.jpg" +"1853" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1853.jpg" +"1854" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1854.jpg" +"1855" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1855.jpg" +"1856" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1856.jpg" +"1857" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1857.jpg" +"1858" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1858.jpg" +"1859" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1859.jpg" +"1860" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1860.jpg" +"1861" "Is the flag fluttering in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1861.jpg" +"1862" "Is the flag motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1862.jpg" +"1863" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1863.jpg" +"1864" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1864.jpg" +"1865" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1865.jpg" +"1866" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1866.jpg" +"1867" "Is the person sit in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1867.jpg" +"1868" "Is the person stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1868.jpg" +"1869" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1869.jpg" +"1870" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1870.jpg" +"1871" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1871.jpg" +"1872" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1872.jpg" +"1873" "Are there three men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1873.jpg" +"1874" "Are there four men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1874.jpg" +"1875" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1875.jpg" +"1876" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1876.jpg" +"1877" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1877.jpg" +"1878" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1878.jpg" +"1879" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1879.jpg" +"1880" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1880.jpg" +"1881" "Are there two men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1881.jpg" +"1882" "Are there three men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1882.jpg" +"1883" "Is the glove black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1883.jpg" +"1884" "Is the glove white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1884.jpg" +"1885" "Are there two flags in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1885.jpg" +"1886" "Are there three flags in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1886.jpg" +"1887" "Is the wall red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1887.jpg" +"1888" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1888.jpg" +"1889" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1889.jpg" +"1890" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1890.jpg" +"1891" "Is there one guitar in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1891.jpg" +"1892" "Are there two guitars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1892.jpg" +"1893" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1893.jpg" +"1894" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1894.jpg" +"1895" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1895.jpg" +"1896" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1896.jpg" +"1897" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1897.jpg" +"1898" "Is the sea turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1898.jpg" +"1899" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1899.jpg" +"1900" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1900.jpg" +"1901" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1901.jpg" +"1902" "Does the dog jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1902.jpg" +"1903" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1903.jpg" +"1904" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1904.jpg" +"1905" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1905.jpg" +"1906" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1906.jpg" +"1907" "Does the man swim in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1907.jpg" +"1908" "Does the man dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1908.jpg" +"1909" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1909.jpg" +"1910" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1910.jpg" +"1911" "Are there two women in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1911.jpg" +"1912" "Are there three women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1912.jpg" +"1913" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1913.jpg" +"1914" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1914.jpg" +"1915" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1915.jpg" +"1916" "Is the lake stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1916.jpg" +"1917" "Is the ship blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1917.jpg" +"1918" "Is the ship red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1918.jpg" +"1919" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1919.jpg" +"1920" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1920.jpg" +"1921" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1921.jpg" +"1922" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1922.jpg" +"1923" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1923.jpg" +"1924" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1924.jpg" +"1925" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1925.jpg" +"1926" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1926.jpg" +"1927" "Is the man sit in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1927.jpg" +"1928" "Is the man stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1928.jpg" +"1929" "Is there one backpack in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1929.jpg" +"1930" "Are there two backpacks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1930.jpg" +"1931" "Is the ground uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1931.jpg" +"1932" "Is the ground flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1932.jpg" +"1933" "Does the woman sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1933.jpg" +"1934" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1934.jpg" +"1935" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1935.jpg" +"1936" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1936.jpg" +"1937" "Does the woman lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1937.jpg" +"1938" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1938.jpg" +"1939" "Is there one camera in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1939.jpg" +"1940" "Are there two cameras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1940.jpg" +"1941" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1941.jpg" +"1942" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1942.jpg" +"1943" "Is the watch black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1943.jpg" +"1944" "Is the watch white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1944.jpg" +"1945" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1945.jpg" +"1946" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1946.jpg" +"1947" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1947.jpg" +"1948" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1948.jpg" +"1949" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1949.jpg" +"1950" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1950.jpg" +"1951" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1951.jpg" +"1952" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1952.jpg" +"1953" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1953.jpg" +"1954" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1954.jpg" +"1955" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1955.jpg" +"1956" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1956.jpg" +"1957" "Are there three children in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1957.jpg" +"1958" "Are there four children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1958.jpg" +"1959" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1959.jpg" +"1960" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1960.jpg" +"1961" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1961.jpg" +"1962" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1962.jpg" +"1963" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1963.jpg" +"1964" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1964.jpg" +"1965" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1965.jpg" +"1966" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1966.jpg" +"1967" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1967.jpg" +"1968" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1968.jpg" +"1969" "Does the child run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1969.jpg" +"1970" "Does the child stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1970.jpg" +"1971" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1971.jpg" +"1972" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1972.jpg" +"1973" "Are there two women in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1973.jpg" +"1974" "Are there three women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1974.jpg" +"1975" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1975.jpg" +"1976" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1976.jpg" +"1977" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1977.jpg" +"1978" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1978.jpg" +"1979" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1979.jpg" +"1980" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1980.jpg" +"1981" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1981.jpg" +"1982" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1982.jpg" +"1983" "Is the grass yellowed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1983.jpg" +"1984" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1984.jpg" +"1985" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1985.jpg" +"1986" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1986.jpg" +"1987" "Does the man take a photo in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1987.jpg" +"1988" "Does the man sing in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1988.jpg" +"1989" "Is there one camera in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1989.jpg" +"1990" "Are there two cameras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1990.jpg" +"1991" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1991.jpg" +"1992" "Are there three glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1992.jpg" +"1993" "Is there one watch in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1993.jpg" +"1994" "Are there two watches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1994.jpg" +"1995" "Does the woman laugh in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1995.jpg" +"1996" "Does the woman cry in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1996.jpg" +"1997" "Is there one microphone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1997.jpg" +"1998" "Are there two microphones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1998.jpg" +"1999" "Is there one support in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/1999.jpg" +"2000" "Are there two supports in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2000.jpg" +"2001" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2001.jpg" +"2002" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2002.jpg" +"2003" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2003.jpg" +"2004" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2004.jpg" +"2005" "Does the person walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2005.jpg" +"2006" "Does the person jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2006.jpg" +"2007" "Is there one flag in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2007.jpg" +"2008" "Are there two flags in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2008.jpg" +"2009" "Does the person write in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2009.jpg" +"2010" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2010.jpg" +"2011" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2011.jpg" +"2012" "Are there two pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2012.jpg" +"2013" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2013.jpg" +"2014" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2014.jpg" +"2015" "Is the table yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2015.jpg" +"2016" "Is the table red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2016.jpg" +"2017" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2017.jpg" +"2018" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2018.jpg" +"2019" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2019.jpg" +"2020" "Is the lake stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2020.jpg" +"2021" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2021.jpg" +"2022" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2022.jpg" +"2023" "Does the person go fishing in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2023.jpg" +"2024" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2024.jpg" +"2025" "Is there one rod in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2025.jpg" +"2026" "Are there two rods in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2026.jpg" +"2027" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2027.jpg" +"2028" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2028.jpg" +"2029" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2029.jpg" +"2030" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2030.jpg" +"2031" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2031.jpg" +"2032" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2032.jpg" +"2033" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2033.jpg" +"2034" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2034.jpg" +"2035" "Is the desert dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2035.jpg" +"2036" "Is the desert wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2036.jpg" +"2037" "Does the woman jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2037.jpg" +"2038" "Does the woman lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2038.jpg" +"2039" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2039.jpg" +"2040" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2040.jpg" +"2041" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2041.jpg" +"2042" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2042.jpg" +"2043" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2043.jpg" +"2044" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2044.jpg" +"2045" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2045.jpg" +"2046" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2046.jpg" +"2047" "Does the man jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2047.jpg" +"2048" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2048.jpg" +"2049" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2049.jpg" +"2050" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2050.jpg" +"2051" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2051.jpg" +"2052" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2052.jpg" +"2053" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2053.jpg" +"2054" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2054.jpg" +"2055" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2055.jpg" +"2056" "Is the sky purple in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2056.jpg" +"2057" "Is the cloud pristine in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2057.jpg" +"2058" "Is the cloud filthy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2058.jpg" +"2059" "Is there one tent in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2059.jpg" +"2060" "Are there two tents in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2060.jpg" +"2061" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2061.jpg" +"2062" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2062.jpg" +"2063" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2063.jpg" +"2064" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2064.jpg" +"2065" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2065.jpg" +"2066" "Is the sky red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2066.jpg" +"2067" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2067.jpg" +"2068" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2068.jpg" +"2069" "Is the sun gentle in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2069.jpg" +"2070" "Is the sun dazzling in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2070.jpg" +"2071" "Is the sea calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2071.jpg" +"2072" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2072.jpg" +"2073" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2073.jpg" +"2074" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2074.jpg" +"2075" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2075.jpg" +"2076" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2076.jpg" +"2077" "Is the sky dim in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2077.jpg" +"2078" "Is the sky bright in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2078.jpg" +"2079" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2079.jpg" +"2080" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2080.jpg" +"2081" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2081.jpg" +"2082" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2082.jpg" +"2083" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2083.jpg" +"2084" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2084.jpg" +"2085" "Does the man climb a tree in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2085.jpg" +"2086" "Does the man dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2086.jpg" +"2087" "Does the woman lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2087.jpg" +"2088" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2088.jpg" +"2089" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2089.jpg" +"2090" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2090.jpg" +"2091" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2091.jpg" +"2092" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2092.jpg" +"2093" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2093.jpg" +"2094" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2094.jpg" +"2095" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2095.jpg" +"2096" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2096.jpg" +"2097" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2097.jpg" +"2098" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2098.jpg" +"2099" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2099.jpg" +"2100" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2100.jpg" +"2101" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2101.jpg" +"2102" "Are there two knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2102.jpg" +"2103" "Is there one coconut in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2103.jpg" +"2104" "Are there two coconuts in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2104.jpg" +"2105" "Are there two men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2105.jpg" +"2106" "Are there three men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2106.jpg" +"2107" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2107.jpg" +"2108" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2108.jpg" +"2109" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2109.jpg" +"2110" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2110.jpg" +"2111" "Is the car red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2111.jpg" +"2112" "Is the car white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2112.jpg" +"2113" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2113.jpg" +"2114" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2114.jpg" +"2115" "Is the bush sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2115.jpg" +"2116" "Is the bush dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2116.jpg" +"2117" "Is the grass sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2117.jpg" +"2118" "Is the grass lush in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2118.jpg" +"2119" "Are there two children in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2119.jpg" +"2120" "Are there three children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2120.jpg" +"2121" "Is the sea rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2121.jpg" +"2122" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2122.jpg" +"2123" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2123.jpg" +"2124" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2124.jpg" +"2125" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2125.jpg" +"2126" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2126.jpg" +"2127" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2127.jpg" +"2128" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2128.jpg" +"2129" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2129.jpg" +"2130" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2130.jpg" +"2131" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2131.jpg" +"2132" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2132.jpg" +"2133" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2133.jpg" +"2134" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2134.jpg" +"2135" "Is the desert yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2135.jpg" +"2136" "Is the desert black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2136.jpg" +"2137" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2137.jpg" +"2138" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2138.jpg" +"2139" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2139.jpg" +"2140" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2140.jpg" +"2141" "Is there one child in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2141.jpg" +"2142" "Are there two children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2142.jpg" +"2143" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2143.jpg" +"2144" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2144.jpg" +"2145" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2145.jpg" +"2146" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2146.jpg" +"2147" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2147.jpg" +"2148" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2148.jpg" +"2149" "Is the lake calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2149.jpg" +"2150" "Is the lake rolling in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2150.jpg" +"2151" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2151.jpg" +"2152" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2152.jpg" +"2153" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2153.jpg" +"2154" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2154.jpg" +"2155" "Are there two bicycles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2155.jpg" +"2156" "Are there three bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2156.jpg" +"2157" "Are there two children in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2157.jpg" +"2158" "Are there three children in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2158.jpg" +"2159" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2159.jpg" +"2160" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2160.jpg" +"2161" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2161.jpg" +"2162" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2162.jpg" +"2163" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2163.jpg" +"2164" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2164.jpg" +"2165" "Does the woman jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2165.jpg" +"2166" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2166.jpg" +"2167" "Is the grass yellowed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2167.jpg" +"2168" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2168.jpg" +"2169" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2169.jpg" +"2170" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2170.jpg" +"2171" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2171.jpg" +"2172" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2172.jpg" +"2173" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2173.jpg" +"2174" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2174.jpg" +"2175" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2175.jpg" +"2176" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2176.jpg" +"2177" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2177.jpg" +"2178" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2178.jpg" +"2179" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2179.jpg" +"2180" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2180.jpg" +"2181" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2181.jpg" +"2182" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2182.jpg" +"2183" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2183.jpg" +"2184" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2184.jpg" +"2185" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2185.jpg" +"2186" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2186.jpg" +"2187" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2187.jpg" +"2188" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2188.jpg" +"2189" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2189.jpg" +"2190" "Is the sun soft in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2190.jpg" +"2191" "Is the desert dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2191.jpg" +"2192" "Is the desert wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2192.jpg" +"2193" "Are there three camels in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2193.jpg" +"2194" "Are there four camels in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2194.jpg" +"2195" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2195.jpg" +"2196" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2196.jpg" +"2197" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2197.jpg" +"2198" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2198.jpg" +"2199" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2199.jpg" +"2200" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2200.jpg" +"2201" "Is the sky bright in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2201.jpg" +"2202" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2202.jpg" +"2203" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2203.jpg" +"2204" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2204.jpg" +"2205" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2205.jpg" +"2206" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2206.jpg" +"2207" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2207.jpg" +"2208" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2208.jpg" +"2209" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2209.jpg" +"2210" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2210.jpg" +"2211" "Are there two cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2211.jpg" +"2212" "Are there three cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2212.jpg" +"2213" "Is the desert yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2213.jpg" +"2214" "Is the desert blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2214.jpg" +"2215" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2215.jpg" +"2216" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2216.jpg" +"2217" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2217.jpg" +"2218" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2218.jpg" +"2219" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2219.jpg" +"2220" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2220.jpg" +"2221" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2221.jpg" +"2222" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2222.jpg" +"2223" "Is there one basket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2223.jpg" +"2224" "Are there two baskets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2224.jpg" +"2225" "Is the blanket red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2225.jpg" +"2226" "Is the blanket black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2226.jpg" +"2227" "Are there two candles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2227.jpg" +"2228" "Are there three candles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2228.jpg" +"2229" "Is the balloon colorful in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2229.jpg" +"2230" "Is the balloon monochromatic in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2230.jpg" +"2231" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2231.jpg" +"2232" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2232.jpg" +"2233" "Is there one volleyball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2233.jpg" +"2234" "Are there two volleyballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2234.jpg" +"2235" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2235.jpg" +"2236" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2236.jpg" +"2237" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2237.jpg" +"2238" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2238.jpg" +"2239" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2239.jpg" +"2240" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2240.jpg" +"2241" "Is the floor yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2241.jpg" +"2242" "Is the floor white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2242.jpg" +"2243" "Is the ribbon messy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2243.jpg" +"2244" "Is the ribbon tidy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2244.jpg" +"2245" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2245.jpg" +"2246" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2246.jpg" +"2247" "Is there one basketball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2247.jpg" +"2248" "Are there three basketballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2248.jpg" +"2249" "Is there one basketball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2249.jpg" +"2250" "Are there two basketballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2250.jpg" +"2251" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2251.jpg" +"2252" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2252.jpg" +"2253" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2253.jpg" +"2254" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2254.jpg" +"2255" "Does the child play soccer in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2255.jpg" +"2256" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2256.jpg" +"2257" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2257.jpg" +"2258" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2258.jpg" +"2259" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2259.jpg" +"2260" "Is the cloud blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2260.jpg" +"2261" "Does the person jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2261.jpg" +"2262" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2262.jpg" +"2263" "Is there one basketball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2263.jpg" +"2264" "Are there two basketballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2264.jpg" +"2265" "Is there one support in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2265.jpg" +"2266" "Are there two supports in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2266.jpg" +"2267" "Is there one bed in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2267.jpg" +"2268" "Are there two beds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2268.jpg" +"2269" "Is the mattress white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2269.jpg" +"2270" "Is the mattress black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2270.jpg" +"2271" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2271.jpg" +"2272" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2272.jpg" +"2273" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2273.jpg" +"2274" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2274.jpg" +"2275" "Are there four eggs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2275.jpg" +"2276" "Are there six eggs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2276.jpg" +"2277" "Is the tablecloth white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2277.jpg" +"2278" "Is the tablecloth black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2278.jpg" +"2279" "Is the blueberry blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2279.jpg" +"2280" "Is the blueberry white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2280.jpg" +"2281" "Is there one scoon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2281.jpg" +"2282" "Are there two scoons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2282.jpg" +"2283" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2283.jpg" +"2284" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2284.jpg" +"2285" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2285.jpg" +"2286" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2286.jpg" +"2287" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2287.jpg" +"2288" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2288.jpg" +"2289" "Is the sea rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2289.jpg" +"2290" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2290.jpg" +"2291" "Are there two ships in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2291.jpg" +"2292" "Are there three ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2292.jpg" +"2293" "Is the river calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2293.jpg" +"2294" "Is the river rolling in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2294.jpg" +"2295" "Is the book neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2295.jpg" +"2296" "Is the book messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2296.jpg" +"2297" "Is the bookshelf clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2297.jpg" +"2298" "Is the bookshelf dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2298.jpg" +"2299" "Is the book open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2299.jpg" +"2300" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2300.jpg" +"2301" "Is the table wooden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2301.jpg" +"2302" "Is the table tiled in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2302.jpg" +"2303" "Is the wall blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2303.jpg" +"2304" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2304.jpg" +"2305" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2305.jpg" +"2306" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2306.jpg" +"2307" "Is the broccoli green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2307.jpg" +"2308" "Is the broccoli blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2308.jpg" +"2309" "Are there two lemons in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2309.jpg" +"2310" "Are there three lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2310.jpg" +"2311" "Is the melon separated in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2311.jpg" +"2312" "Is the melon complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2312.jpg" +"2313" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2313.jpg" +"2314" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2314.jpg" +"2315" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2315.jpg" +"2316" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2316.jpg" +"2317" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2317.jpg" +"2318" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2318.jpg" +"2319" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2319.jpg" +"2320" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2320.jpg" +"2321" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2321.jpg" +"2322" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2322.jpg" +"2323" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2323.jpg" +"2324" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2324.jpg" +"2325" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2325.jpg" +"2326" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2326.jpg" +"2327" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2327.jpg" +"2328" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2328.jpg" +"2329" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2329.jpg" +"2330" "Does the cat sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2330.jpg" +"2331" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2331.jpg" +"2332" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2332.jpg" +"2333" "Are there two lounges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2333.jpg" +"2334" "Are there three lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2334.jpg" +"2335" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2335.jpg" +"2336" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2336.jpg" +"2337" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2337.jpg" +"2338" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2338.jpg" +"2339" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2339.jpg" +"2340" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2340.jpg" +"2341" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2341.jpg" +"2342" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2342.jpg" +"2343" "Is there one chicken in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2343.jpg" +"2344" "Are there two chickens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2344.jpg" +"2345" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2345.jpg" +"2346" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2346.jpg" +"2347" "Does the chicken stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2347.jpg" +"2348" "Does the chicken run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2348.jpg" +"2349" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2349.jpg" +"2350" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2350.jpg" +"2351" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2351.jpg" +"2352" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2352.jpg" +"2353" "Does the man strike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2353.jpg" +"2354" "Does the man jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2354.jpg" +"2355" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2355.jpg" +"2356" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2356.jpg" +"2357" "Is the ball white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2357.jpg" +"2358" "Is the ball black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2358.jpg" +"2359" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2359.jpg" +"2360" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2360.jpg" +"2361" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2361.jpg" +"2362" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2362.jpg" +"2363" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2363.jpg" +"2364" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2364.jpg" +"2365" "Does the cow eat in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2365.jpg" +"2366" "Does the cow run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2366.jpg" +"2367" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2367.jpg" +"2368" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2368.jpg" +"2369" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2369.jpg" +"2370" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2370.jpg" +"2371" "Is the sky gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2371.jpg" +"2372" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2372.jpg" +"2373" "Is the sea turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2373.jpg" +"2374" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2374.jpg" +"2375" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2375.jpg" +"2376" "Is the keyboard black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2376.jpg" +"2377" "Is the table brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2377.jpg" +"2378" "Is the table yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2378.jpg" +"2379" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2379.jpg" +"2380" "Are there three mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2380.jpg" +"2381" "Is the mousepad black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2381.jpg" +"2382" "Is the mousepad red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2382.jpg" +"2383" "Is the toy brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2383.jpg" +"2384" "Is the toy red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2384.jpg" +"2385" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2385.jpg" +"2386" "Are there five chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2386.jpg" +"2387" "Are there five bananas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2387.jpg" +"2388" "Are there six bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2388.jpg" +"2389" "Does the cat raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2389.jpg" +"2390" "Does the cat lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2390.jpg" +"2391" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2391.jpg" +"2392" "Is the bath black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2392.jpg" +"2393" "Is there one bucket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2393.jpg" +"2394" "Are there three buckets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2394.jpg" +"2395" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2395.jpg" +"2396" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2396.jpg" +"2397" "Does the dog lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2397.jpg" +"2398" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2398.jpg" +"2399" "Is the bear brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2399.jpg" +"2400" "Is the bear yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2400.jpg" +"2401" "Does the plane run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2401.jpg" +"2402" "Does the plane stop in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2402.jpg" +"2403" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2403.jpg" +"2404" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2404.jpg" +"2405" "Is the grass yellow-green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2405.jpg" +"2406" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2406.jpg" +"2407" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2407.jpg" +"2408" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2408.jpg" +"2409" "Are there two cows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2409.jpg" +"2410" "Are there three cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2410.jpg" +"2411" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2411.jpg" +"2412" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2412.jpg" +"2413" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2413.jpg" +"2414" "Does the person crouch in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2414.jpg" +"2415" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2415.jpg" +"2416" "Is the sea motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2416.jpg" +"2417" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2417.jpg" +"2418" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2418.jpg" +"2419" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2419.jpg" +"2420" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2420.jpg" +"2421" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2421.jpg" +"2422" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2422.jpg" +"2423" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2423.jpg" +"2424" "Is the sea motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2424.jpg" +"2425" "Is there one wineglass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2425.jpg" +"2426" "Are there two wineglasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2426.jpg" +"2427" "Is there one alarm in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2427.jpg" +"2428" "Are there two alarms in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2428.jpg" +"2429" "Is there one book in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2429.jpg" +"2430" "Are there three books in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2430.jpg" +"2431" "Does the person skiing in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2431.jpg" +"2432" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2432.jpg" +"2433" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2433.jpg" +"2434" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2434.jpg" +"2435" "Does the woman laugh in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2435.jpg" +"2436" "Does the woman cry in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2436.jpg" +"2437" "Is the phone silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2437.jpg" +"2438" "Is the phone green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2438.jpg" +"2439" "Is the frisbee blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2439.jpg" +"2440" "Is the frisbee black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2440.jpg" +"2441" "Does the dog jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2441.jpg" +"2442" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2442.jpg" +"2443" "Is the train yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2443.jpg" +"2444" "Is the train green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2444.jpg" +"2445" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2445.jpg" +"2446" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2446.jpg" +"2447" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2447.jpg" +"2448" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2448.jpg" +"2449" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2449.jpg" +"2450" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2450.jpg" +"2451" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2451.jpg" +"2452" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2452.jpg" +"2453" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2453.jpg" +"2454" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2454.jpg" +"2455" "Does the plane fly in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2455.jpg" +"2456" "Does the plane slide in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2456.jpg" +"2457" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2457.jpg" +"2458" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2458.jpg" +"2459" "Does the cat sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2459.jpg" +"2460" "Does the cat run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2460.jpg" +"2461" "Is the hat green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2461.jpg" +"2462" "Is the hat blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2462.jpg" +"2463" "Is the wall black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2463.jpg" +"2464" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2464.jpg" +"2465" "Is the ship white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2465.jpg" +"2466" "Is the ship red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2466.jpg" +"2467" "Are there two cows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2467.jpg" +"2468" "Are there five cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2468.jpg" +"2469" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2469.jpg" +"2470" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2470.jpg" +"2471" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2471.jpg" +"2472" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2472.jpg" +"2473" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2473.jpg" +"2474" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2474.jpg" +"2475" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2475.jpg" +"2476" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2476.jpg" +"2477" "Does the bird stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2477.jpg" +"2478" "Does the bird sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2478.jpg" +"2479" "Is the sky gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2479.jpg" +"2480" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2480.jpg" +"2481" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2481.jpg" +"2482" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2482.jpg" +"2483" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2483.jpg" +"2484" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2484.jpg" +"2485" "Is there one tie in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2485.jpg" +"2486" "Are there two ties in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2486.jpg" +"2487" "Does the bird stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2487.jpg" +"2488" "Does the bird fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2488.jpg" +"2489" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2489.jpg" +"2490" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2490.jpg" +"2491" "Is the leave green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2491.jpg" +"2492" "Is the leave yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2492.jpg" +"2493" "Does the person upside down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2493.jpg" +"2494" "Does the person standing in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2494.jpg" +"2495" "Are there two skates in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2495.jpg" +"2496" "Are there three skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2496.jpg" +"2497" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2497.jpg" +"2498" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2498.jpg" +"2499" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2499.jpg" +"2500" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2500.jpg" +"2501" "Is the sea restless in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2501.jpg" +"2502" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2502.jpg" +"2503" "Is the note yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2503.jpg" +"2504" "Is the note black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2504.jpg" +"2505" "Is there one microwave in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2505.jpg" +"2506" "Are there two microwaves in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2506.jpg" +"2507" "Is the cabinet suspended in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2507.jpg" +"2508" "Is the cabinet grounded in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2508.jpg" +"2509" "Are there two cups in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2509.jpg" +"2510" "Are there four cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2510.jpg" +"2511" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2511.jpg" +"2512" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2512.jpg" +"2513" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2513.jpg" +"2514" "Is the forest yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2514.jpg" +"2515" "Are there two zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2515.jpg" +"2516" "Are there five zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2516.jpg" +"2517" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2517.jpg" +"2518" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2518.jpg" +"2519" "Does the sea peaceful in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2519.jpg" +"2520" "Does the sea turbulent in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2520.jpg" +"2521" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2521.jpg" +"2522" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2522.jpg" +"2523" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2523.jpg" +"2524" "Are there three ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2524.jpg" +"2525" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2525.jpg" +"2526" "Is the sky yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2526.jpg" +"2527" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2527.jpg" +"2528" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2528.jpg" +"2529" "Are there three phones in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2529.jpg" +"2530" "Are there four phones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2530.jpg" +"2531" "Is the notebook open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2531.jpg" +"2532" "Is the notebook closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2532.jpg" +"2533" "Are there two oranges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2533.jpg" +"2534" "Are there six oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2534.jpg" +"2535" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2535.jpg" +"2536" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2536.jpg" +"2537" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2537.jpg" +"2538" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2538.jpg" +"2539" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2539.jpg" +"2540" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2540.jpg" +"2541" "Is there one alarm in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2541.jpg" +"2542" "Are there three alarms in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2542.jpg" +"2543" "Is the quilt white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2543.jpg" +"2544" "Is the quilt black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2544.jpg" +"2545" "Is the pillow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2545.jpg" +"2546" "Is the pillow blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2546.jpg" +"2547" "Are there two elephants in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2547.jpg" +"2548" "Are there six elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2548.jpg" +"2549" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2549.jpg" +"2550" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2550.jpg" +"2551" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2551.jpg" +"2552" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2552.jpg" +"2553" "Does the woman play ball in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2553.jpg" +"2554" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2554.jpg" +"2555" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2555.jpg" +"2556" "Are there three rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2556.jpg" +"2557" "Is the ground deep blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2557.jpg" +"2558" "Is the ground white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2558.jpg" +"2559" "Does the electrombile motionless in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2559.jpg" +"2560" "Does the electrombile cycling in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2560.jpg" +"2561" "Is the wall natural wood in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2561.jpg" +"2562" "Is the wall concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2562.jpg" +"2563" "Is the ground gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2563.jpg" +"2564" "Is the ground white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2564.jpg" +"2565" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2565.jpg" +"2566" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2566.jpg" +"2567" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2567.jpg" +"2568" "Are there three rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2568.jpg" +"2569" "Is the ball yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2569.jpg" +"2570" "Is the ball red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2570.jpg" +"2571" "Is the ground red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2571.jpg" +"2572" "Is the ground white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2572.jpg" +"2573" "Is there one drawing in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2573.jpg" +"2574" "Are there three drawings in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2574.jpg" +"2575" "Does the lamp open in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2575.jpg" +"2576" "Does the lamp closed in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2576.jpg" +"2577" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2577.jpg" +"2578" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2578.jpg" +"2579" "Is the pillow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2579.jpg" +"2580" "Is the pillow gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2580.jpg" +"2581" "Is the quilt white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2581.jpg" +"2582" "Is the quilt red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2582.jpg" +"2583" "Are there two chairs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2583.jpg" +"2584" "Are there four chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2584.jpg" +"2585" "Is the table brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2585.jpg" +"2586" "Is the table white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2586.jpg" +"2587" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2587.jpg" +"2588" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2588.jpg" +"2589" "Is there one tire in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2589.jpg" +"2590" "Are there four tires in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2590.jpg" +"2591" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2591.jpg" +"2592" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2592.jpg" +"2593" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2593.jpg" +"2594" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2594.jpg" +"2595" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2595.jpg" +"2596" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2596.jpg" +"2597" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2597.jpg" +"2598" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2598.jpg" +"2599" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2599.jpg" +"2600" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2600.jpg" +"2601" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2601.jpg" +"2602" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2602.jpg" +"2603" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2603.jpg" +"2604" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2604.jpg" +"2605" "Is the luggage black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2605.jpg" +"2606" "Is the luggage red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2606.jpg" +"2607" "Are there two benches in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2607.jpg" +"2608" "Are there five benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2608.jpg" +"2609" "Does the woman sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2609.jpg" +"2610" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2610.jpg" +"2611" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2611.jpg" +"2612" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2612.jpg" +"2613" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2613.jpg" +"2614" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2614.jpg" +"2615" "Is there one bus in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2615.jpg" +"2616" "Are there two buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2616.jpg" +"2617" "Is the house red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2617.jpg" +"2618" "Is the house blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2618.jpg" +"2619" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2619.jpg" +"2620" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2620.jpg" +"2621" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2621.jpg" +"2622" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2622.jpg" +"2623" "Are there three birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2623.jpg" +"2624" "Are there nine birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2624.jpg" +"2625" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2625.jpg" +"2626" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2626.jpg" +"2627" "Is the river sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2627.jpg" +"2628" "Is the river calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2628.jpg" +"2629" "Is there one elephant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2629.jpg" +"2630" "Are there three elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2630.jpg" +"2631" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2631.jpg" +"2632" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2632.jpg" +"2633" "Is the tree withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2633.jpg" +"2634" "Is the tree lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2634.jpg" +"2635" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2635.jpg" +"2636" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2636.jpg" +"2637" "Is the sound black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2637.jpg" +"2638" "Is the sound pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2638.jpg" +"2639" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2639.jpg" +"2640" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2640.jpg" +"2641" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2641.jpg" +"2642" "Are there three cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2642.jpg" +"2643" "Is there one socket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2643.jpg" +"2644" "Are there four sockets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2644.jpg" +"2645" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2645.jpg" +"2646" "Is the wall yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2646.jpg" +"2647" "Are there two drawings in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2647.jpg" +"2648" "Are there three drawings in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2648.jpg" +"2649" "Is the table messy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2649.jpg" +"2650" "Is the table neat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2650.jpg" +"2651" "Does the bear lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2651.jpg" +"2652" "Does the bear stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2652.jpg" +"2653" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2653.jpg" +"2654" "Are there three trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2654.jpg" +"2655" "Is the sign red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2655.jpg" +"2656" "Is the sign black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2656.jpg" +"2657" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2657.jpg" +"2658" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2658.jpg" +"2659" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2659.jpg" +"2660" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2660.jpg" +"2661" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2661.jpg" +"2662" "Is the forest blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2662.jpg" +"2663" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2663.jpg" +"2664" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2664.jpg" +"2665" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2665.jpg" +"2666" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2666.jpg" +"2667" "Is there one vase in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2667.jpg" +"2668" "Are there two vases in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2668.jpg" +"2669" "Is the flower fresh in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2669.jpg" +"2670" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2670.jpg" +"2671" "Are there two elephants in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2671.jpg" +"2672" "Are there three elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2672.jpg" +"2673" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2673.jpg" +"2674" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2674.jpg" +"2675" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2675.jpg" +"2676" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2676.jpg" +"2677" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2677.jpg" +"2678" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2678.jpg" +"2679" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2679.jpg" +"2680" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2680.jpg" +"2681" "Does the person play ball in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2681.jpg" +"2682" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2682.jpg" +"2683" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2683.jpg" +"2684" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2684.jpg" +"2685" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2685.jpg" +"2686" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2686.jpg" +"2687" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2687.jpg" +"2688" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2688.jpg" +"2689" "Is the water murky in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2689.jpg" +"2690" "Is the water clear in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2690.jpg" +"2691" "Does the person cycling in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2691.jpg" +"2692" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2692.jpg" +"2693" "Are there three horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2693.jpg" +"2694" "Are there four horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2694.jpg" +"2695" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2695.jpg" +"2696" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2696.jpg" +"2697" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2697.jpg" +"2698" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2698.jpg" +"2699" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2699.jpg" +"2700" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2700.jpg" +"2701" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2701.jpg" +"2702" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2702.jpg" +"2703" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2703.jpg" +"2704" "Is the snow pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2704.jpg" +"2705" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2705.jpg" +"2706" "Are there five planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2706.jpg" +"2707" "Does the bird lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2707.jpg" +"2708" "Does the bird fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2708.jpg" +"2709" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2709.jpg" +"2710" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2710.jpg" +"2711" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2711.jpg" +"2712" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2712.jpg" +"2713" "Does the bird stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2713.jpg" +"2714" "Does the bird fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2714.jpg" +"2715" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2715.jpg" +"2716" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2716.jpg" +"2717" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2717.jpg" +"2718" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2718.jpg" +"2719" "Is the television small-sized in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2719.jpg" +"2720" "Is the television large-sized in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2720.jpg" +"2721" "Is the box silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2721.jpg" +"2722" "Is the box black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2722.jpg" +"2723" "Is the cabinet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2723.jpg" +"2724" "Is the cabinet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2724.jpg" +"2725" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2725.jpg" +"2726" "Are there two tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2726.jpg" +"2727" "Is there one sofa in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2727.jpg" +"2728" "Are there two sofas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2728.jpg" +"2729" "Is the floor brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2729.jpg" +"2730" "Is the floor gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2730.jpg" +"2731" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2731.jpg" +"2732" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2732.jpg" +"2733" "Is the sunflower fresh in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2733.jpg" +"2734" "Is the sunflower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2734.jpg" +"2735" "Is the vase white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2735.jpg" +"2736" "Is the vase black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2736.jpg" +"2737" "Is the wall reddish-brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2737.jpg" +"2738" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2738.jpg" +"2739" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2739.jpg" +"2740" "Is the plate blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2740.jpg" +"2741" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2741.jpg" +"2742" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2742.jpg" +"2743" "Does the cat raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2743.jpg" +"2744" "Does the cat lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2744.jpg" +"2745" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2745.jpg" +"2746" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2746.jpg" +"2747" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2747.jpg" +"2748" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2748.jpg" +"2749" "Does the dog jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2749.jpg" +"2750" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2750.jpg" +"2751" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2751.jpg" +"2752" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2752.jpg" +"2753" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2753.jpg" +"2754" "Are there three toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2754.jpg" +"2755" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2755.jpg" +"2756" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2756.jpg" +"2757" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2757.jpg" +"2758" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2758.jpg" +"2759" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2759.jpg" +"2760" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2760.jpg" +"2761" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2761.jpg" +"2762" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2762.jpg" +"2763" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2763.jpg" +"2764" "Is the sink gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2764.jpg" +"2765" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2765.jpg" +"2766" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2766.jpg" +"2767" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2767.jpg" +"2768" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2768.jpg" +"2769" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2769.jpg" +"2770" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2770.jpg" +"2771" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2771.jpg" +"2772" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2772.jpg" +"2773" "Is the sea restless in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2773.jpg" +"2774" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2774.jpg" +"2775" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2775.jpg" +"2776" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2776.jpg" +"2777" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2777.jpg" +"2778" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2778.jpg" +"2779" "Does the bear walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2779.jpg" +"2780" "Does the bear sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2780.jpg" +"2781" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2781.jpg" +"2782" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2782.jpg" +"2783" "Is the flower yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2783.jpg" +"2784" "Is the flower red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2784.jpg" +"2785" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2785.jpg" +"2786" "Is the snow green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2786.jpg" +"2787" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2787.jpg" +"2788" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2788.jpg" +"2789" "Does the person skiing in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2789.jpg" +"2790" "Does the person hike in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2790.jpg" +"2791" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2791.jpg" +"2792" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2792.jpg" +"2793" "Is the phone open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2793.jpg" +"2794" "Is the phone closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2794.jpg" +"2795" "Are there three monies in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2795.jpg" +"2796" "Are there six monies in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2796.jpg" +"2797" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2797.jpg" +"2798" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2798.jpg" +"2799" "Does the cat raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2799.jpg" +"2800" "Does the cat lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2800.jpg" +"2801" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2801.jpg" +"2802" "Are there six toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2802.jpg" +"2803" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2803.jpg" +"2804" "Is the wall pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2804.jpg" +"2805" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2805.jpg" +"2806" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2806.jpg" +"2807" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2807.jpg" +"2808" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2808.jpg" +"2809" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2809.jpg" +"2810" "Is the forest white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2810.jpg" +"2811" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2811.jpg" +"2812" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2812.jpg" +"2813" "Does the cat sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2813.jpg" +"2814" "Does the cat run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2814.jpg" +"2815" "Is the wall yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2815.jpg" +"2816" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2816.jpg" +"2817" "Is there one alarm in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2817.jpg" +"2818" "Are there three alarms in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2818.jpg" +"2819" "Is the bookshelf neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2819.jpg" +"2820" "Is the bookshelf messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2820.jpg" +"2821" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2821.jpg" +"2822" "Is the tree blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2822.jpg" +"2823" "Is there one sign in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2823.jpg" +"2824" "Are there two signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2824.jpg" +"2825" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2825.jpg" +"2826" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2826.jpg" +"2827" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2827.jpg" +"2828" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2828.jpg" +"2829" "Is there one shoe in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2829.jpg" +"2830" "Are there three shoes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2830.jpg" +"2831" "Is the floor khaki in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2831.jpg" +"2832" "Is the floor white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2832.jpg" +"2833" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2833.jpg" +"2834" "Are there five benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2834.jpg" +"2835" "Is the sailing white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2835.jpg" +"2836" "Is the sailing blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2836.jpg" +"2837" "Is the island large in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2837.jpg" +"2838" "Is the island small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2838.jpg" +"2839" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2839.jpg" +"2840" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2840.jpg" +"2841" "Is the lake calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2841.jpg" +"2842" "Is the lake restless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2842.jpg" +"2843" "Does the cat raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2843.jpg" +"2844" "Does the cat lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2844.jpg" +"2845" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2845.jpg" +"2846" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2846.jpg" +"2847" "Does the giraffe stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2847.jpg" +"2848" "Does the giraffe lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2848.jpg" +"2849" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2849.jpg" +"2850" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2850.jpg" +"2851" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2851.jpg" +"2852" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2852.jpg" +"2853" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2853.jpg" +"2854" "Is the forest black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2854.jpg" +"2855" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2855.jpg" +"2856" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2856.jpg" +"2857" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2857.jpg" +"2858" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2858.jpg" +"2859" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2859.jpg" +"2860" "Are there three kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2860.jpg" +"2861" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2861.jpg" +"2862" "Is the cloud green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2862.jpg" +"2863" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2863.jpg" +"2864" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2864.jpg" +"2865" "Is the ground wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2865.jpg" +"2866" "Is the ground narrow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2866.jpg" +"2867" "Does the man run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2867.jpg" +"2868" "Does the man lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2868.jpg" +"2869" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2869.jpg" +"2870" "Are there three footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2870.jpg" +"2871" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2871.jpg" +"2872" "Is the tree white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2872.jpg" +"2873" "Is the house short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2873.jpg" +"2874" "Is the house tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2874.jpg" +"2875" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2875.jpg" +"2876" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2876.jpg" +"2877" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2877.jpg" +"2878" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2878.jpg" +"2879" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2879.jpg" +"2880" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2880.jpg" +"2881" "Is the river sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2881.jpg" +"2882" "Is the river calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2882.jpg" +"2883" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2883.jpg" +"2884" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2884.jpg" +"2885" "Is the bridge long in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2885.jpg" +"2886" "Is the bridge short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2886.jpg" +"2887" "Is the forest withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2887.jpg" +"2888" "Is the forest lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2888.jpg" +"2889" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2889.jpg" +"2890" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2890.jpg" +"2891" "Is there one sign in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2891.jpg" +"2892" "Are there two signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2892.jpg" +"2893" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2893.jpg" +"2894" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2894.jpg" +"2895" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2895.jpg" +"2896" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2896.jpg" +"2897" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2897.jpg" +"2898" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2898.jpg" +"2899" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2899.jpg" +"2900" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2900.jpg" +"2901" "Is the door open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2901.jpg" +"2902" "Is the door closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2902.jpg" +"2903" "Is the lock gold in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2903.jpg" +"2904" "Is the lock silver in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2904.jpg" +"2905" "Is the wall yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2905.jpg" +"2906" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2906.jpg" +"2907" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2907.jpg" +"2908" "Is the toilet gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2908.jpg" +"2909" "Does the person skiing in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2909.jpg" +"2910" "Does the person lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2910.jpg" +"2911" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2911.jpg" +"2912" "Is the snow green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2912.jpg" +"2913" "Is there one snowboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2913.jpg" +"2914" "Are there two snowboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2914.jpg" +"2915" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2915.jpg" +"2916" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2916.jpg" +"2917" "Is the umbrella red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2917.jpg" +"2918" "Is the umbrella green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2918.jpg" +"2919" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2919.jpg" +"2920" "Is the sky red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2920.jpg" +"2921" "Is the sea gentle waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2921.jpg" +"2922" "Is the sea raging waves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2922.jpg" +"2923" "Is there one zebra in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2923.jpg" +"2924" "Are there three zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2924.jpg" +"2925" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2925.jpg" +"2926" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2926.jpg" +"2927" "Is the telephone square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2927.jpg" +"2928" "Is the telephone round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2928.jpg" +"2929" "Is the mouse black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2929.jpg" +"2930" "Is the mouse pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2930.jpg" +"2931" "Is the keyboard black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2931.jpg" +"2932" "Is the keyboard silver in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2932.jpg" +"2933" "Is there one mousepad in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2933.jpg" +"2934" "Are there three mousepads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2934.jpg" +"2935" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2935.jpg" +"2936" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2936.jpg" +"2937" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2937.jpg" +"2938" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2938.jpg" +"2939" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2939.jpg" +"2940" "Are there five chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2940.jpg" +"2941" "Is the wall yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2941.jpg" +"2942" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2942.jpg" +"2943" "Is the extinguisher red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2943.jpg" +"2944" "Is the extinguisher green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2944.jpg" +"2945" "Is the chair silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2945.jpg" +"2946" "Is the chair yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2946.jpg" +"2947" "Is the wall natural wood in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2947.jpg" +"2948" "Is the wall concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2948.jpg" +"2949" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2949.jpg" +"2950" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2950.jpg" +"2951" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2951.jpg" +"2952" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2952.jpg" +"2953" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2953.jpg" +"2954" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2954.jpg" +"2955" "Is the sea calm waters in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2955.jpg" +"2956" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2956.jpg" +"2957" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2957.jpg" +"2958" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2958.jpg" +"2959" "Are there two taps in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2959.jpg" +"2960" "Are there four taps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2960.jpg" +"2961" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2961.jpg" +"2962" "Is the bath yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2962.jpg" +"2963" "Is the wall tiled in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2963.jpg" +"2964" "Is the wall concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2964.jpg" +"2965" "Is the floor tiled in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2965.jpg" +"2966" "Is the floor wooden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2966.jpg" +"2967" "Does the dog walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2967.jpg" +"2968" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2968.jpg" +"2969" "Is the ground tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2969.jpg" +"2970" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2970.jpg" +"2971" "Is the wall uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2971.jpg" +"2972" "Is the wall smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2972.jpg" +"2973" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2973.jpg" +"2974" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2974.jpg" +"2975" "Are there two snowboards in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2975.jpg" +"2976" "Are there four snowboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2976.jpg" +"2977" "Are there two poles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2977.jpg" +"2978" "Are there four poles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2978.jpg" +"2979" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2979.jpg" +"2980" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2980.jpg" +"2981" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2981.jpg" +"2982" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2982.jpg" +"2983" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2983.jpg" +"2984" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2984.jpg" +"2985" "Is the television open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2985.jpg" +"2986" "Is the television closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2986.jpg" +"2987" "Does the cat raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2987.jpg" +"2988" "Does the cat lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2988.jpg" +"2989" "Is the cabinet grounded in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2989.jpg" +"2990" "Is the cabinet suspended in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2990.jpg" +"2991" "Is the carpet gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2991.jpg" +"2992" "Is the carpet red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2992.jpg" +"2993" "Is the box standing in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2993.jpg" +"2994" "Is the box flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2994.jpg" +"2995" "Is the curtain tight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2995.jpg" +"2996" "Is the curtain spread out in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2996.jpg" +"2997" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2997.jpg" +"2998" "Is the wall green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2998.jpg" +"2999" "Are there three cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/2999.jpg" +"3000" "Are there four cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3000.jpg" +"3001" "Is the bicycle upright in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3001.jpg" +"3002" "Is the bicycle tilted in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3002.jpg" +"3003" "Is the road smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3003.jpg" +"3004" "Is the road uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3004.jpg" +"3005" "Is the phone open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3005.jpg" +"3006" "Is the phone closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3006.jpg" +"3007" "Is the monitor open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3007.jpg" +"3008" "Is the monitor closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3008.jpg" +"3009" "Does the bird fly in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3009.jpg" +"3010" "Does the bird stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3010.jpg" +"3011" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3011.jpg" +"3012" "Is the sea turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3012.jpg" +"3013" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3013.jpg" +"3014" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3014.jpg" +"3015" "Does the bird stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3015.jpg" +"3016" "Does the bird fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3016.jpg" +"3017" "Is the apple withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3017.jpg" +"3018" "Is the apple plump in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3018.jpg" +"3019" "Is the grass gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3019.jpg" +"3020" "Is the grass green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3020.jpg" +"3021" "Is the wall green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3021.jpg" +"3022" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3022.jpg" +"3023" "Is there one lamp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3023.jpg" +"3024" "Are there four lamps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3024.jpg" +"3025" "Does the cat sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3025.jpg" +"3026" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3026.jpg" +"3027" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3027.jpg" +"3028" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3028.jpg" +"3029" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3029.jpg" +"3030" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3030.jpg" +"3031" "Does the horse walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3031.jpg" +"3032" "Does the horse run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3032.jpg" +"3033" "Does the woman sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3033.jpg" +"3034" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3034.jpg" +"3035" "Is the forest emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3035.jpg" +"3036" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3036.jpg" +"3037" "Does the giraffe stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3037.jpg" +"3038" "Does the giraffe run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3038.jpg" +"3039" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3039.jpg" +"3040" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3040.jpg" +"3041" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3041.jpg" +"3042" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3042.jpg" +"3043" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3043.jpg" +"3044" "Is the cloud blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3044.jpg" +"3045" "Is the sea spectacular in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3045.jpg" +"3046" "Is the sea blue seas and clear skies in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3046.jpg" +"3047" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3047.jpg" +"3048" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3048.jpg" +"3049" "Are there three benches in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3049.jpg" +"3050" "Are there four benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3050.jpg" +"3051" "Is the grass sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3051.jpg" +"3052" "Is the grass lush in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3052.jpg" +"3053" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3053.jpg" +"3054" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3054.jpg" +"3055" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3055.jpg" +"3056" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3056.jpg" +"3057" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3057.jpg" +"3058" "Is the ground tiled in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3058.jpg" +"3059" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3059.jpg" +"3060" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3060.jpg" +"3061" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3061.jpg" +"3062" "Is the mountain low in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3062.jpg" +"3063" "Does the plane stop in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3063.jpg" +"3064" "Does the plane fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3064.jpg" +"3065" "Is the backpack green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3065.jpg" +"3066" "Is the backpack white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3066.jpg" +"3067" "Is the luggage red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3067.jpg" +"3068" "Is the luggage silver in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3068.jpg" +"3069" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3069.jpg" +"3070" "Are there three chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3070.jpg" +"3071" "Does the kite fly in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3071.jpg" +"3072" "Does the kite lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3072.jpg" +"3073" "Is there one line in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3073.jpg" +"3074" "Are there three lines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3074.jpg" +"3075" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3075.jpg" +"3076" "Is the sky red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3076.jpg" +"3077" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3077.jpg" +"3078" "Is the cloud green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3078.jpg" +"3079" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3079.jpg" +"3080" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3080.jpg" +"3081" "Are there two signs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3081.jpg" +"3082" "Are there four signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3082.jpg" +"3083" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3083.jpg" +"3084" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3084.jpg" +"3085" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3085.jpg" +"3086" "Are there three planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3086.jpg" +"3087" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3087.jpg" +"3088" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3088.jpg" +"3089" "Is the cloud gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3089.jpg" +"3090" "Is the cloud white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3090.jpg" +"3091" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3091.jpg" +"3092" "Are there five cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3092.jpg" +"3093" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3093.jpg" +"3094" "Is the mountain low in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3094.jpg" +"3095" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3095.jpg" +"3096" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3096.jpg" +"3097" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3097.jpg" +"3098" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3098.jpg" +"3099" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3099.jpg" +"3100" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3100.jpg" +"3101" "Is the forest verdant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3101.jpg" +"3102" "Is the forest barren in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3102.jpg" +"3103" "Is the car red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3103.jpg" +"3104" "Is the car white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3104.jpg" +"3105" "Is the road muddy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3105.jpg" +"3106" "Is the road concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3106.jpg" +"3107" "Is there one sign in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3107.jpg" +"3108" "Are there three signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3108.jpg" +"3109" "Are there two bears in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3109.jpg" +"3110" "Are there five bears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3110.jpg" +"3111" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3111.jpg" +"3112" "Is the snow green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3112.jpg" +"3113" "Is the sea calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3113.jpg" +"3114" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3114.jpg" +"3115" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3115.jpg" +"3116" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3116.jpg" +"3117" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3117.jpg" +"3118" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3118.jpg" +"3119" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3119.jpg" +"3120" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3120.jpg" +"3121" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3121.jpg" +"3122" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3122.jpg" +"3123" "Does the person cycling in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3123.jpg" +"3124" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3124.jpg" +"3125" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3125.jpg" +"3126" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3126.jpg" +"3127" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3127.jpg" +"3128" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3128.jpg" +"3129" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3129.jpg" +"3130" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3130.jpg" +"3131" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3131.jpg" +"3132" "Does the man lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3132.jpg" +"3133" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3133.jpg" +"3134" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3134.jpg" +"3135" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3135.jpg" +"3136" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3136.jpg" +"3137" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3137.jpg" +"3138" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3138.jpg" +"3139" "Is the phone open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3139.jpg" +"3140" "Is the phone closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3140.jpg" +"3141" "Is there one ebook in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3141.jpg" +"3142" "Are there two ebooks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3142.jpg" +"3143" "Is the sky golden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3143.jpg" +"3144" "Is the sky green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3144.jpg" +"3145" "Are there two seegulls in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3145.jpg" +"3146" "Are there six seegulls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3146.jpg" +"3147" "Is the sea endless in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3147.jpg" +"3148" "Is the sea surrounded by water in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3148.jpg" +"3149" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3149.jpg" +"3150" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3150.jpg" +"3151" "Is the tree sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3151.jpg" +"3152" "Is the tree dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3152.jpg" +"3153" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3153.jpg" +"3154" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3154.jpg" +"3155" "Is the sky bright red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3155.jpg" +"3156" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3156.jpg" +"3157" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3157.jpg" +"3158" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3158.jpg" +"3159" "Does the cat stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3159.jpg" +"3160" "Does the cat sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3160.jpg" +"3161" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3161.jpg" +"3162" "Is the wall uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3162.jpg" +"3163" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3163.jpg" +"3164" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3164.jpg" +"3165" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3165.jpg" +"3166" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3166.jpg" +"3167" "Is the bed neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3167.jpg" +"3168" "Is the bed messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3168.jpg" +"3169" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3169.jpg" +"3170" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3170.jpg" +"3171" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3171.jpg" +"3172" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3172.jpg" +"3173" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3173.jpg" +"3174" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3174.jpg" +"3175" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3175.jpg" +"3176" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3176.jpg" +"3177" "Is the sky gloomy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3177.jpg" +"3178" "Is the sky sunny in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3178.jpg" +"3179" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3179.jpg" +"3180" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3180.jpg" +"3181" "Are there seven lounges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3181.jpg" +"3182" "Are there nine lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3182.jpg" +"3183" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3183.jpg" +"3184" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3184.jpg" +"3185" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3185.jpg" +"3186" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3186.jpg" +"3187" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3187.jpg" +"3188" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3188.jpg" +"3189" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3189.jpg" +"3190" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3190.jpg" +"3191" "Is the car stopped in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3191.jpg" +"3192" "Is the car driving in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3192.jpg" +"3193" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3193.jpg" +"3194" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3194.jpg" +"3195" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3195.jpg" +"3196" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3196.jpg" +"3197" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3197.jpg" +"3198" "Is the cloud green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3198.jpg" +"3199" "Are there two benches in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3199.jpg" +"3200" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3200.jpg" +"3201" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3201.jpg" +"3202" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3202.jpg" +"3203" "Is there one streetlamp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3203.jpg" +"3204" "Are there three streetlamps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3204.jpg" +"3205" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3205.jpg" +"3206" "Is the snow green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3206.jpg" +"3207" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3207.jpg" +"3208" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3208.jpg" +"3209" "Are there two snowboards in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3209.jpg" +"3210" "Are there three snowboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3210.jpg" +"3211" "Are there two poles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3211.jpg" +"3212" "Are there four poles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3212.jpg" +"3213" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3213.jpg" +"3214" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3214.jpg" +"3215" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3215.jpg" +"3216" "Is the cloud green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3216.jpg" +"3217" "Is the grass vast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3217.jpg" +"3218" "Is the grass small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3218.jpg" +"3219" "Is the ground flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3219.jpg" +"3220" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3220.jpg" +"3221" "Does the sheep run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3221.jpg" +"3222" "Does the sheep lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3222.jpg" +"3223" "Is the fence short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3223.jpg" +"3224" "Is the fence tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3224.jpg" +"3225" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3225.jpg" +"3226" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3226.jpg" +"3227" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3227.jpg" +"3228" "Are there three umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3228.jpg" +"3229" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3229.jpg" +"3230" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3230.jpg" +"3231" "Is the computer open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3231.jpg" +"3232" "Is the computer closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3232.jpg" +"3233" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3233.jpg" +"3234" "Are there three keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3234.jpg" +"3235" "Is the table neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3235.jpg" +"3236" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3236.jpg" +"3237" "Is there one kettle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3237.jpg" +"3238" "Are there two kettles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3238.jpg" +"3239" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3239.jpg" +"3240" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3240.jpg" +"3241" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3241.jpg" +"3242" "Does the cat sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3242.jpg" +"3243" "Does the woman lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3243.jpg" +"3244" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3244.jpg" +"3245" "Is there one laptop in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3245.jpg" +"3246" "Are there two laptops in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3246.jpg" +"3247" "Is the quilt white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3247.jpg" +"3248" "Is the quilt black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3248.jpg" +"3249" "Are there two bananas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3249.jpg" +"3250" "Are there three bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3250.jpg" +"3251" "Is the cup white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3251.jpg" +"3252" "Is the cup black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3252.jpg" +"3253" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3253.jpg" +"3254" "Is the plate green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3254.jpg" +"3255" "Is there one scoon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3255.jpg" +"3256" "Are there three scoons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3256.jpg" +"3257" "Is the tablecloth clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3257.jpg" +"3258" "Is the tablecloth dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3258.jpg" +"3259" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3259.jpg" +"3260" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3260.jpg" +"3261" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3261.jpg" +"3262" "Is the cloud green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3262.jpg" +"3263" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3263.jpg" +"3264" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3264.jpg" +"3265" "Is the river shallow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3265.jpg" +"3266" "Is the river deep in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3266.jpg" +"3267" "Does the cow stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3267.jpg" +"3268" "Does the cow lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3268.jpg" +"3269" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3269.jpg" +"3270" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3270.jpg" +"3271" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3271.jpg" +"3272" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3272.jpg" +"3273" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3273.jpg" +"3274" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3274.jpg" +"3275" "Does the person bend in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3275.jpg" +"3276" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3276.jpg" +"3277" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3277.jpg" +"3278" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3278.jpg" +"3279" "Is there one doll in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3279.jpg" +"3280" "Are there two dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3280.jpg" +"3281" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3281.jpg" +"3282" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3282.jpg" +"3283" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3283.jpg" +"3284" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3284.jpg" +"3285" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3285.jpg" +"3286" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3286.jpg" +"3287" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3287.jpg" +"3288" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3288.jpg" +"3289" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3289.jpg" +"3290" "Is the cloud green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3290.jpg" +"3291" "Are there two motorbikes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3291.jpg" +"3292" "Are there four motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3292.jpg" +"3293" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3293.jpg" +"3294" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3294.jpg" +"3295" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3295.jpg" +"3296" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3296.jpg" +"3297" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3297.jpg" +"3298" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3298.jpg" +"3299" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3299.jpg" +"3300" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3300.jpg" +"3301" "Are there two cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3301.jpg" +"3302" "Are there three cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3302.jpg" +"3303" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3303.jpg" +"3304" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3304.jpg" +"3305" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3305.jpg" +"3306" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3306.jpg" +"3307" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3307.jpg" +"3308" "Is the sky green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3308.jpg" +"3309" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3309.jpg" +"3310" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3310.jpg" +"3311" "Is the wall red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3311.jpg" +"3312" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3312.jpg" +"3313" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3313.jpg" +"3314" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3314.jpg" +"3315" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3315.jpg" +"3316" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3316.jpg" +"3317" "Is the bench green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3317.jpg" +"3318" "Is the bench red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3318.jpg" +"3319" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3319.jpg" +"3320" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3320.jpg" +"3321" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3321.jpg" +"3322" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3322.jpg" +"3323" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3323.jpg" +"3324" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3324.jpg" +"3325" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3325.jpg" +"3326" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3326.jpg" +"3327" "Is the wire straight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3327.jpg" +"3328" "Is the wire curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3328.jpg" +"3329" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3329.jpg" +"3330" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3330.jpg" +"3331" "Is the sky overcast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3331.jpg" +"3332" "Is the sky bright in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3332.jpg" +"3333" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3333.jpg" +"3334" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3334.jpg" +"3335" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3335.jpg" +"3336" "Is the tree blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3336.jpg" +"3337" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3337.jpg" +"3338" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3338.jpg" +"3339" "Is the tissue white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3339.jpg" +"3340" "Is the tissue blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3340.jpg" +"3341" "Is there one bin in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3341.jpg" +"3342" "Are there two bins in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3342.jpg" +"3343" "Is the vase 1 in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3343.jpg" +"3344" "Is the vase 2 in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3344.jpg" +"3345" "Is there one spray in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3345.jpg" +"3346" "Are there two sprays in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3346.jpg" +"3347" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3347.jpg" +"3348" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3348.jpg" +"3349" "Are there three dolls in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3349.jpg" +"3350" "Are there four dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3350.jpg" +"3351" "Is the book open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3351.jpg" +"3352" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3352.jpg" +"3353" "Are there two giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3353.jpg" +"3354" "Are there three giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3354.jpg" +"3355" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3355.jpg" +"3356" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3356.jpg" +"3357" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3357.jpg" +"3358" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3358.jpg" +"3359" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3359.jpg" +"3360" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3360.jpg" +"3361" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3361.jpg" +"3362" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3362.jpg" +"3363" "Is the sea restless in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3363.jpg" +"3364" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3364.jpg" +"3365" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3365.jpg" +"3366" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3366.jpg" +"3367" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3367.jpg" +"3368" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3368.jpg" +"3369" "Are there seven planes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3369.jpg" +"3370" "Are there eight planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3370.jpg" +"3371" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3371.jpg" +"3372" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3372.jpg" +"3373" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3373.jpg" +"3374" "Does the cat run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3374.jpg" +"3375" "Is there one shoe in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3375.jpg" +"3376" "Are there two shoes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3376.jpg" +"3377" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3377.jpg" +"3378" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3378.jpg" +"3379" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3379.jpg" +"3380" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3380.jpg" +"3381" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3381.jpg" +"3382" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3382.jpg" +"3383" "Is the keyboard black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3383.jpg" +"3384" "Is the keyboard white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3384.jpg" +"3385" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3385.jpg" +"3386" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3386.jpg" +"3387" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3387.jpg" +"3388" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3388.jpg" +"3389" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3389.jpg" +"3390" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3390.jpg" +"3391" "Are there three zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3391.jpg" +"3392" "Are there four zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3392.jpg" +"3393" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3393.jpg" +"3394" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3394.jpg" +"3395" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3395.jpg" +"3396" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3396.jpg" +"3397" "Are there three surfboards in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3397.jpg" +"3398" "Are there four surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3398.jpg" +"3399" "Are there three people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3399.jpg" +"3400" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3400.jpg" +"3401" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3401.jpg" +"3402" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3402.jpg" +"3403" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3403.jpg" +"3404" "Is the wall uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3404.jpg" +"3405" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3405.jpg" +"3406" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3406.jpg" +"3407" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3407.jpg" +"3408" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3408.jpg" +"3409" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3409.jpg" +"3410" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3410.jpg" +"3411" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3411.jpg" +"3412" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3412.jpg" +"3413" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3413.jpg" +"3414" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3414.jpg" +"3415" "Is the bus red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3415.jpg" +"3416" "Is the bus white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3416.jpg" +"3417" "Is the tree withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3417.jpg" +"3418" "Is the tree lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3418.jpg" +"3419" "Is the wall tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3419.jpg" +"3420" "Is the wall short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3420.jpg" +"3421" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3421.jpg" +"3422" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3422.jpg" +"3423" "Is the house good-looking in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3423.jpg" +"3424" "Is the house ugly in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3424.jpg" +"3425" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3425.jpg" +"3426" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3426.jpg" +"3427" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3427.jpg" +"3428" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3428.jpg" +"3429" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3429.jpg" +"3430" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3430.jpg" +"3431" "Does the woman run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3431.jpg" +"3432" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3432.jpg" +"3433" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3433.jpg" +"3434" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3434.jpg" +"3435" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3435.jpg" +"3436" "Is the sky green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3436.jpg" +"3437" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3437.jpg" +"3438" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3438.jpg" +"3439" "Is there one bus in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3439.jpg" +"3440" "Are there two buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3440.jpg" +"3441" "Is the mountain green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3441.jpg" +"3442" "Is the mountain blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3442.jpg" +"3443" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3443.jpg" +"3444" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3444.jpg" +"3445" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3445.jpg" +"3446" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3446.jpg" +"3447" "Is the river sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3447.jpg" +"3448" "Is the river calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3448.jpg" +"3449" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3449.jpg" +"3450" "Is the tree black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3450.jpg" +"3451" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3451.jpg" +"3452" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3452.jpg" +"3453" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3453.jpg" +"3454" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3454.jpg" +"3455" "Is the cat lie prone in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3455.jpg" +"3456" "Is the cat stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3456.jpg" +"3457" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3457.jpg" +"3458" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3458.jpg" +"3459" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3459.jpg" +"3460" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3460.jpg" +"3461" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3461.jpg" +"3462" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3462.jpg" +"3463" "Is the tussock dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3463.jpg" +"3464" "Is the tussock sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3464.jpg" +"3465" "Does the cat stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3465.jpg" +"3466" "Does the cat lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3466.jpg" +"3467" "Are there two shoes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3467.jpg" +"3468" "Are there six shoes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3468.jpg" +"3469" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3469.jpg" +"3470" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3470.jpg" +"3471" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3471.jpg" +"3472" "Is the toilet blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3472.jpg" +"3473" "Are there three pipes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3473.jpg" +"3474" "Are there four pipes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3474.jpg" +"3475" "Is the wall clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3475.jpg" +"3476" "Is the wall dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3476.jpg" +"3477" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3477.jpg" +"3478" "Is the grass pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3478.jpg" +"3479" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3479.jpg" +"3480" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3480.jpg" +"3481" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3481.jpg" +"3482" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3482.jpg" +"3483" "Is the fence short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3483.jpg" +"3484" "Is the fence tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3484.jpg" +"3485" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3485.jpg" +"3486" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3486.jpg" +"3487" "Is the tussock withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3487.jpg" +"3488" "Is the tussock lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3488.jpg" +"3489" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3489.jpg" +"3490" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3490.jpg" +"3491" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3491.jpg" +"3492" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3492.jpg" +"3493" "Are there two elephants in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3493.jpg" +"3494" "Are there three elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3494.jpg" +"3495" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3495.jpg" +"3496" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3496.jpg" +"3497" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3497.jpg" +"3498" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3498.jpg" +"3499" "Does the monkey scratch in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3499.jpg" +"3500" "Does the monkey release in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3500.jpg" +"3501" "Is the banana incomplete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3501.jpg" +"3502" "Is the banana complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3502.jpg" +"3503" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3503.jpg" +"3504" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3504.jpg" +"3505" "Is the hydrant closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3505.jpg" +"3506" "Is the hydrant open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3506.jpg" +"3507" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3507.jpg" +"3508" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3508.jpg" +"3509" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3509.jpg" +"3510" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3510.jpg" +"3511" "Does the sheep stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3511.jpg" +"3512" "Does the sheep run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3512.jpg" +"3513" "Is the fence firm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3513.jpg" +"3514" "Is the fence broken in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3514.jpg" +"3515" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3515.jpg" +"3516" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3516.jpg" +"3517" "Is the carrot orange in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3517.jpg" +"3518" "Is the carrot purple in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3518.jpg" +"3519" "Is there one necklace in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3519.jpg" +"3520" "Are there three necklaces in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3520.jpg" +"3521" "Is the sky gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3521.jpg" +"3522" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3522.jpg" +"3523" "Is the cloud gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3523.jpg" +"3524" "Is the cloud white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3524.jpg" +"3525" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3525.jpg" +"3526" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3526.jpg" +"3527" "Is the sign square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3527.jpg" +"3528" "Is the sign round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3528.jpg" +"3529" "Is the keyboard square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3529.jpg" +"3530" "Is the keyboard round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3530.jpg" +"3531" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3531.jpg" +"3532" "Are there two mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3532.jpg" +"3533" "Are there two lounges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3533.jpg" +"3534" "Are there three lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3534.jpg" +"3535" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3535.jpg" +"3536" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3536.jpg" +"3537" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3537.jpg" +"3538" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3538.jpg" +"3539" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3539.jpg" +"3540" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3540.jpg" +"3541" "Is the umbrella spread out in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3541.jpg" +"3542" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3542.jpg" +"3543" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3543.jpg" +"3544" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3544.jpg" +"3545" "Is the bookshelf brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3545.jpg" +"3546" "Is the bookshelf black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3546.jpg" +"3547" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3547.jpg" +"3548" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3548.jpg" +"3549" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3549.jpg" +"3550" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3550.jpg" +"3551" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3551.jpg" +"3552" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3552.jpg" +"3553" "Is the mountain steep in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3553.jpg" +"3554" "Is the mountain gentle in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3554.jpg" +"3555" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3555.jpg" +"3556" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3556.jpg" +"3557" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3557.jpg" +"3558" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3558.jpg" +"3559" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3559.jpg" +"3560" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3560.jpg" +"3561" "Is the sheep white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3561.jpg" +"3562" "Is the sheep black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3562.jpg" +"3563" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3563.jpg" +"3564" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3564.jpg" +"3565" "Is the forest emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3565.jpg" +"3566" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3566.jpg" +"3567" "Does the man cycling in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3567.jpg" +"3568" "Does the man stop in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3568.jpg" +"3569" "Does the woman cycling in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3569.jpg" +"3570" "Does the woman stop in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3570.jpg" +"3571" "Are there two bicycles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3571.jpg" +"3572" "Are there three bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3572.jpg" +"3573" "Are there six cows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3573.jpg" +"3574" "Are there seven cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3574.jpg" +"3575" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3575.jpg" +"3576" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3576.jpg" +"3577" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3577.jpg" +"3578" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3578.jpg" +"3579" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3579.jpg" +"3580" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3580.jpg" +"3581" "Is the toilet dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3581.jpg" +"3582" "Is the toilet pure white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3582.jpg" +"3583" "Are there two papers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3583.jpg" +"3584" "Are there three papers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3584.jpg" +"3585" "Is the tank white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3585.jpg" +"3586" "Is the tank black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3586.jpg" +"3587" "Is the box closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3587.jpg" +"3588" "Is the box open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3588.jpg" +"3589" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3589.jpg" +"3590" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3590.jpg" +"3591" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3591.jpg" +"3592" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3592.jpg" +"3593" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3593.jpg" +"3594" "Is the forest withering in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3594.jpg" +"3595" "Is the ground uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3595.jpg" +"3596" "Is the ground smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3596.jpg" +"3597" "Is the cloud gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3597.jpg" +"3598" "Is the cloud white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3598.jpg" +"3599" "Are there two bicycles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3599.jpg" +"3600" "Are there four bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3600.jpg" +"3601" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3601.jpg" +"3602" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3602.jpg" +"3603" "Is the house red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3603.jpg" +"3604" "Is the house white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3604.jpg" +"3605" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3605.jpg" +"3606" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3606.jpg" +"3607" "Is the hydrant closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3607.jpg" +"3608" "Is the hydrant started in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3608.jpg" +"3609" "Is the sky gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3609.jpg" +"3610" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3610.jpg" +"3611" "Is the necklace black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3611.jpg" +"3612" "Is the necklace white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3612.jpg" +"3613" "Does the dog slide in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3613.jpg" +"3614" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3614.jpg" +"3615" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3615.jpg" +"3616" "Are there three skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3616.jpg" +"3617" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3617.jpg" +"3618" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3618.jpg" +"3619" "Is the fence white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3619.jpg" +"3620" "Is the fence blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3620.jpg" +"3621" "Is the scarf yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3621.jpg" +"3622" "Is the scarf white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3622.jpg" +"3623" "Is the rope long in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3623.jpg" +"3624" "Is the rope short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3624.jpg" +"3625" "Are there two bicycles in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3625.jpg" +"3626" "Are there three bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3626.jpg" +"3627" "Is the cup blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3627.jpg" +"3628" "Is the cup white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3628.jpg" +"3629" "Is there one coffee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3629.jpg" +"3630" "Are there two coffees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3630.jpg" +"3631" "Are there two plates in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3631.jpg" +"3632" "Are there three plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3632.jpg" +"3633" "Are there two doughnuts in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3633.jpg" +"3634" "Are there three doughnuts in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3634.jpg" +"3635" "Is the mirror complete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3635.jpg" +"3636" "Is the mirror broken in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3636.jpg" +"3637" "Are there two toothbrushes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3637.jpg" +"3638" "Are there five toothbrushes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3638.jpg" +"3639" "Is the cup brown in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3639.jpg" +"3640" "Is the cup blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3640.jpg" +"3641" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3641.jpg" +"3642" "Is the lake calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3642.jpg" +"3643" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3643.jpg" +"3644" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3644.jpg" +"3645" "Is the pulp oval in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3645.jpg" +"3646" "Is the pulp square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3646.jpg" +"3647" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3647.jpg" +"3648" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3648.jpg" +"3649" "Is the paddle black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3649.jpg" +"3650" "Is the paddle white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3650.jpg" +"3651" "Is the necklace black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3651.jpg" +"3652" "Is the necklace white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3652.jpg" +"3653" "Is the ground smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3653.jpg" +"3654" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3654.jpg" +"3655" "Are there two buses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3655.jpg" +"3656" "Are there four buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3656.jpg" +"3657" "Are there three cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3657.jpg" +"3658" "Are there five cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3658.jpg" +"3659" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3659.jpg" +"3660" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3660.jpg" +"3661" "Is the tree emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3661.jpg" +"3662" "Is the tree yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3662.jpg" +"3663" "Are there two streetlamps in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3663.jpg" +"3664" "Are there six streetlamps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3664.jpg" +"3665" "Does the zebra lower in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3665.jpg" +"3666" "Does the zebra raise in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3666.jpg" +"3667" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3667.jpg" +"3668" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3668.jpg" +"3669" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3669.jpg" +"3670" "Is the forest withering in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3670.jpg" +"3671" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3671.jpg" +"3672" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3672.jpg" +"3673" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3673.jpg" +"3674" "Does the woman run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3674.jpg" +"3675" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3675.jpg" +"3676" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3676.jpg" +"3677" "Are there three horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3677.jpg" +"3678" "Are there five horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3678.jpg" +"3679" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3679.jpg" +"3680" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3680.jpg" +"3681" "Does the bear walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3681.jpg" +"3682" "Does the bear run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3682.jpg" +"3683" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3683.jpg" +"3684" "Is the forest withering in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3684.jpg" +"3685" "Is the wall uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3685.jpg" +"3686" "Is the wall smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3686.jpg" +"3687" "Does the man scratch in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3687.jpg" +"3688" "Does the man release in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3688.jpg" +"3689" "Is the bowl white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3689.jpg" +"3690" "Is the bowl black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3690.jpg" +"3691" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3691.jpg" +"3692" "Is the plate blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3692.jpg" +"3693" "Is the tree withering in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3693.jpg" +"3694" "Is the tree lush in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3694.jpg" +"3695" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3695.jpg" +"3696" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3696.jpg" +"3697" "Does the dog raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3697.jpg" +"3698" "Does the dog lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3698.jpg" +"3699" "Is the frisbee yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3699.jpg" +"3700" "Is the frisbee gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3700.jpg" +"3701" "Is the grass yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3701.jpg" +"3702" "Is the grass green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3702.jpg" +"3703" "Does the woman scratch in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3703.jpg" +"3704" "Does the woman release in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3704.jpg" +"3705" "Is there one phone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3705.jpg" +"3706" "Are there two phones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3706.jpg" +"3707" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3707.jpg" +"3708" "Is the toilet gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3708.jpg" +"3709" "Is the bin black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3709.jpg" +"3710" "Is the bin white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3710.jpg" +"3711" "Is the towel white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3711.jpg" +"3712" "Is the towel yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3712.jpg" +"3713" "Are there two beds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3713.jpg" +"3714" "Are there three beds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3714.jpg" +"3715" "Are there three pillows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3715.jpg" +"3716" "Are there five pillows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3716.jpg" +"3717" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3717.jpg" +"3718" "Is the wall green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3718.jpg" +"3719" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3719.jpg" +"3720" "Does the person slide in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3720.jpg" +"3721" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3721.jpg" +"3722" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3722.jpg" +"3723" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3723.jpg" +"3724" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3724.jpg" +"3725" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3725.jpg" +"3726" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3726.jpg" +"3727" "Does the cat stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3727.jpg" +"3728" "Does the cat run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3728.jpg" +"3729" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3729.jpg" +"3730" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3730.jpg" +"3731" "Are there three sunflowers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3731.jpg" +"3732" "Are there five sunflowers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3732.jpg" +"3733" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3733.jpg" +"3734" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3734.jpg" +"3735" "Is the wall uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3735.jpg" +"3736" "Is the wall smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3736.jpg" +"3737" "Does the bear sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3737.jpg" +"3738" "Does the bear run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3738.jpg" +"3739" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3739.jpg" +"3740" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3740.jpg" +"3741" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3741.jpg" +"3742" "Is the forest withering in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3742.jpg" +"3743" "Is the house blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3743.jpg" +"3744" "Is the house red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3744.jpg" +"3745" "Is the cloud gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3745.jpg" +"3746" "Is the cloud white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3746.jpg" +"3747" "Is the fence damaged in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3747.jpg" +"3748" "Is the fence intact in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3748.jpg" +"3749" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3749.jpg" +"3750" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3750.jpg" +"3751" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3751.jpg" +"3752" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3752.jpg" +"3753" "Is there one fork in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3753.jpg" +"3754" "Are there two forks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3754.jpg" +"3755" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3755.jpg" +"3756" "Is the plate gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3756.jpg" +"3757" "Is there one cake in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3757.jpg" +"3758" "Are there three cakes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3758.jpg" +"3759" "Is the bench black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3759.jpg" +"3760" "Is the bench white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3760.jpg" +"3761" "Does the woman lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3761.jpg" +"3762" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3762.jpg" +"3763" "Is the book spread out in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3763.jpg" +"3764" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3764.jpg" +"3765" "Are there two sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3765.jpg" +"3766" "Are there three sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3766.jpg" +"3767" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3767.jpg" +"3768" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3768.jpg" +"3769" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3769.jpg" +"3770" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3770.jpg" +"3771" "Does the elephant walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3771.jpg" +"3772" "Does the elephant run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3772.jpg" +"3773" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3773.jpg" +"3774" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3774.jpg" +"3775" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3775.jpg" +"3776" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3776.jpg" +"3777" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3777.jpg" +"3778" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3778.jpg" +"3779" "Is there one doll in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3779.jpg" +"3780" "Are there two dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3780.jpg" +"3781" "Is the chair black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3781.jpg" +"3782" "Is the chair yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3782.jpg" +"3783" "Is the phone started in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3783.jpg" +"3784" "Is the phone closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3784.jpg" +"3785" "Is the table yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3785.jpg" +"3786" "Is the table white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3786.jpg" +"3787" "Is the forest verdant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3787.jpg" +"3788" "Is the forest barren in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3788.jpg" +"3789" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3789.jpg" +"3790" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3790.jpg" +"3791" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3791.jpg" +"3792" "Are there three bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3792.jpg" +"3793" "Does the truck stop in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3793.jpg" +"3794" "Does the truck sport in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3794.jpg" +"3795" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3795.jpg" +"3796" "Are there three trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3796.jpg" +"3797" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3797.jpg" +"3798" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3798.jpg" +"3799" "Is the ground muddy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3799.jpg" +"3800" "Is the ground concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3800.jpg" +"3801" "Is the rail straight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3801.jpg" +"3802" "Is the rail curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3802.jpg" +"3803" "Is there one cake in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3803.jpg" +"3804" "Are there three cakes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3804.jpg" +"3805" "Is the kiwifruit green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3805.jpg" +"3806" "Is the kiwifruit yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3806.jpg" +"3807" "Is the peach yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3807.jpg" +"3808" "Is the peach red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3808.jpg" +"3809" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3809.jpg" +"3810" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3810.jpg" +"3811" "Is the snow pristine in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3811.jpg" +"3812" "Is the snow filthy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3812.jpg" +"3813" "Is the forest sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3813.jpg" +"3814" "Is the forest dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3814.jpg" +"3815" "Is the sun semicircle in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3815.jpg" +"3816" "Is the sun round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3816.jpg" +"3817" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3817.jpg" +"3818" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3818.jpg" +"3819" "Does the parasail glide in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3819.jpg" +"3820" "Does the parasail stop in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3820.jpg" +"3821" "Does the person fly in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3821.jpg" +"3822" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3822.jpg" +"3823" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3823.jpg" +"3824" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3824.jpg" +"3825" "Are there two toothbrushes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3825.jpg" +"3826" "Are there six toothbrushes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3826.jpg" +"3827" "Is there one toothpaste in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3827.jpg" +"3828" "Are there three toothpastes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3828.jpg" +"3829" "Is the table wooden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3829.jpg" +"3830" "Is the table tiled in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3830.jpg" +"3831" "Is the wall striped in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3831.jpg" +"3832" "Is the wall floral in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3832.jpg" +"3833" "Is the forest colorful in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3833.jpg" +"3834" "Is the forest sparse vegetation in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3834.jpg" +"3835" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3835.jpg" +"3836" "Is the lake turbulent and surging in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3836.jpg" +"3837" "Is the paddle wooden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3837.jpg" +"3838" "Is the paddle plastic in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3838.jpg" +"3839" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3839.jpg" +"3840" "Are there three ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3840.jpg" +"3841" "Are there four people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3841.jpg" +"3842" "Are there five people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3842.jpg" +"3843" "Does the umbrella open in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3843.jpg" +"3844" "Does the umbrella close in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3844.jpg" +"3845" "Is there one zebra in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3845.jpg" +"3846" "Are there three zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3846.jpg" +"3847" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3847.jpg" +"3848" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3848.jpg" +"3849" "Does the car park in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3849.jpg" +"3850" "Does the car drive in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3850.jpg" +"3851" "Is the grass verdant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3851.jpg" +"3852" "Is the grass withering in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3852.jpg" +"3853" "Is the forest layered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3853.jpg" +"3854" "Is the forest yellowing leaves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3854.jpg" +"3855" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3855.jpg" +"3856" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3856.jpg" +"3857" "Is the cloud pristine in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3857.jpg" +"3858" "Is the cloud cloudy skies in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3858.jpg" +"3859" "Is the forest sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3859.jpg" +"3860" "Is the forest dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3860.jpg" +"3861" "Is the river calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3861.jpg" +"3862" "Is the river stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3862.jpg" +"3863" "Does the bicycle stop in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3863.jpg" +"3864" "Does the bicycle drive in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3864.jpg" +"3865" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3865.jpg" +"3866" "Are there three toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3866.jpg" +"3867" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3867.jpg" +"3868" "Are there three toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3868.jpg" +"3869" "Is the floor tiled in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3869.jpg" +"3870" "Is the floor wooden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3870.jpg" +"3871" "Is the cabinet natural wood color in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3871.jpg" +"3872" "Is the cabinet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3872.jpg" +"3873" "Is the tissue cylindrical in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3873.jpg" +"3874" "Is the tissue square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3874.jpg" +"3875" "Is there one holder in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3875.jpg" +"3876" "Are there three holders in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3876.jpg" +"3877" "Is the wall patterned in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3877.jpg" +"3878" "Is the wall solid color in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3878.jpg" +"3879" "Is the sea rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3879.jpg" +"3880" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3880.jpg" +"3881" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3881.jpg" +"3882" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3882.jpg" +"3883" "Is the cloud spotless in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3883.jpg" +"3884" "Is the cloud filthy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3884.jpg" +"3885" "Is the tree sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3885.jpg" +"3886" "Is the tree dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3886.jpg" +"3887" "Are there two lounges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3887.jpg" +"3888" "Are there three lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3888.jpg" +"3889" "Does the person cycling in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3889.jpg" +"3890" "Does the person stop in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3890.jpg" +"3891" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3891.jpg" +"3892" "Are there three motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3892.jpg" +"3893" "Is the flower pink in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3893.jpg" +"3894" "Is the flower yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3894.jpg" +"3895" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3895.jpg" +"3896" "Is the forest yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3896.jpg" +"3897" "Is there one cone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3897.jpg" +"3898" "Are there three cones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3898.jpg" +"3899" "Is the hydrant black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3899.jpg" +"3900" "Is the hydrant red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3900.jpg" +"3901" "Is the cat lie down in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3901.jpg" +"3902" "Is the cat stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3902.jpg" +"3903" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3903.jpg" +"3904" "Are there two mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3904.jpg" +"3905" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3905.jpg" +"3906" "Is the keyboard silver in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3906.jpg" +"3907" "Does the bus motionless in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3907.jpg" +"3908" "Does the bus driving in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3908.jpg" +"3909" "Is the sky pure white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3909.jpg" +"3910" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3910.jpg" +"3911" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3911.jpg" +"3912" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3912.jpg" +"3913" "Are there two computers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3913.jpg" +"3914" "Are there five computers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3914.jpg" +"3915" "Is the mouse black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3915.jpg" +"3916" "Is the mouse pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3916.jpg" +"3917" "Is the keyboard black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3917.jpg" +"3918" "Is the keyboard white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3918.jpg" +"3919" "Is the table yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3919.jpg" +"3920" "Is the table white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3920.jpg" +"3921" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3921.jpg" +"3922" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3922.jpg" +"3923" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3923.jpg" +"3924" "Are there three ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3924.jpg" +"3925" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3925.jpg" +"3926" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3926.jpg" +"3927" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3927.jpg" +"3928" "Are there three surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3928.jpg" +"3929" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3929.jpg" +"3930" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3930.jpg" +"3931" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3931.jpg" +"3932" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3932.jpg" +"3933" "Does the train drive in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3933.jpg" +"3934" "Does the train stop in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3934.jpg" +"3935" "Is the rail straight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3935.jpg" +"3936" "Is the rail curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3936.jpg" +"3937" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3937.jpg" +"3938" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3938.jpg" +"3939" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3939.jpg" +"3940" "Is the grass barren in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3940.jpg" +"3941" "Is the forest verdant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3941.jpg" +"3942" "Is the forest falling yellow leaves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3942.jpg" +"3943" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3943.jpg" +"3944" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3944.jpg" +"3945" "Are there four people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3945.jpg" +"3946" "Are there five people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3946.jpg" +"3947" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3947.jpg" +"3948" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3948.jpg" +"3949" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3949.jpg" +"3950" "Are there three trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3950.jpg" +"3951" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3951.jpg" +"3952" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3952.jpg" +"3953" "Is there one house in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3953.jpg" +"3954" "Are there three houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3954.jpg" +"3955" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3955.jpg" +"3956" "Is the sun gentle in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3956.jpg" +"3957" "Is the sky pure white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3957.jpg" +"3958" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3958.jpg" +"3959" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3959.jpg" +"3960" "Are there three hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3960.jpg" +"3961" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3961.jpg" +"3962" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3962.jpg" +"3963" "Is the forest shaded by green trees in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3963.jpg" +"3964" "Is the forest fruit trees withering in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3964.jpg" +"3965" "Does the cat bite in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3965.jpg" +"3966" "Does the cat scratch in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3966.jpg" +"3967" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3967.jpg" +"3968" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3968.jpg" +"3969" "Is the bear cute in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3969.jpg" +"3970" "Is the bear annoying in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3970.jpg" +"3971" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3971.jpg" +"3972" "Does the cat run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3972.jpg" +"3973" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3973.jpg" +"3974" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3974.jpg" +"3975" "Is there one flowerpot in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3975.jpg" +"3976" "Are there two flowerpots in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3976.jpg" +"3977" "Is the pot complete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3977.jpg" +"3978" "Is the pot damaged in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3978.jpg" +"3979" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3979.jpg" +"3980" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3980.jpg" +"3981" "Is the reef hard in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3981.jpg" +"3982" "Is the reef soft in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3982.jpg" +"3983" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3983.jpg" +"3984" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3984.jpg" +"3985" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3985.jpg" +"3986" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3986.jpg" +"3987" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3987.jpg" +"3988" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3988.jpg" +"3989" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3989.jpg" +"3990" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3990.jpg" +"3991" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3991.jpg" +"3992" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3992.jpg" +"3993" "Is there one parasail in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3993.jpg" +"3994" "Are there two parasails in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3994.jpg" +"3995" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3995.jpg" +"3996" "Is the snow green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3996.jpg" +"3997" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3997.jpg" +"3998" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3998.jpg" +"3999" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/3999.jpg" +"4000" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4000.jpg" +"4001" "Is the bench white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4001.jpg" +"4002" "Is the bench black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4002.jpg" +"4003" "Is there one doll in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4003.jpg" +"4004" "Are there two dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4004.jpg" +"4005" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4005.jpg" +"4006" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4006.jpg" +"4007" "Is the road clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4007.jpg" +"4008" "Is the road dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4008.jpg" +"4009" "Is the sand dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4009.jpg" +"4010" "Is the sand wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4010.jpg" +"4011" "Is there one bus in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4011.jpg" +"4012" "Are there two buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4012.jpg" +"4013" "Is the table neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4013.jpg" +"4014" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4014.jpg" +"4015" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4015.jpg" +"4016" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4016.jpg" +"4017" "Are there two laptops in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4017.jpg" +"4018" "Are there three laptops in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4018.jpg" +"4019" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4019.jpg" +"4020" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4020.jpg" +"4021" "Is the bag black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4021.jpg" +"4022" "Is the bag white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4022.jpg" +"4023" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4023.jpg" +"4024" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4024.jpg" +"4025" "Are there six sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4025.jpg" +"4026" "Are there eight sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4026.jpg" +"4027" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4027.jpg" +"4028" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4028.jpg" +"4029" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4029.jpg" +"4030" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4030.jpg" +"4031" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4031.jpg" +"4032" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4032.jpg" +"4033" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4033.jpg" +"4034" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4034.jpg" +"4035" "Does the horse stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4035.jpg" +"4036" "Does the horse lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4036.jpg" +"4037" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4037.jpg" +"4038" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4038.jpg" +"4039" "Is the manhole round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4039.jpg" +"4040" "Is the manhole square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4040.jpg" +"4041" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4041.jpg" +"4042" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4042.jpg" +"4043" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4043.jpg" +"4044" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4044.jpg" +"4045" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4045.jpg" +"4046" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4046.jpg" +"4047" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4047.jpg" +"4048" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4048.jpg" +"4049" "Is there one electrombile in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4049.jpg" +"4050" "Are there two electrombiles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4050.jpg" +"4051" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4051.jpg" +"4052" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4052.jpg" +"4053" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4053.jpg" +"4054" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4054.jpg" +"4055" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4055.jpg" +"4056" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4056.jpg" +"4057" "Are there two shoes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4057.jpg" +"4058" "Are there three shoes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4058.jpg" +"4059" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4059.jpg" +"4060" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4060.jpg" +"4061" "Is the cloth messy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4061.jpg" +"4062" "Is the cloth neat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4062.jpg" +"4063" "Is the pillow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4063.jpg" +"4064" "Is the pillow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4064.jpg" +"4065" "Is the curtain linen in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4065.jpg" +"4066" "Is the curtain green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4066.jpg" +"4067" "Are there two dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4067.jpg" +"4068" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4068.jpg" +"4069" "Is the quilt spread out in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4069.jpg" +"4070" "Is the quilt folded in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4070.jpg" +"4071" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4071.jpg" +"4072" "Is the wall uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4072.jpg" +"4073" "Is the bed neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4073.jpg" +"4074" "Is the bed messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4074.jpg" +"4075" "Are there four pillows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4075.jpg" +"4076" "Are there six pillows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4076.jpg" +"4077" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4077.jpg" +"4078" "Is the wall uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4078.jpg" +"4079" "Is there one lamp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4079.jpg" +"4080" "Are there two lamps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4080.jpg" +"4081" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4081.jpg" +"4082" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4082.jpg" +"4083" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4083.jpg" +"4084" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4084.jpg" +"4085" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4085.jpg" +"4086" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4086.jpg" +"4087" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4087.jpg" +"4088" "Is the wall uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4088.jpg" +"4089" "Is the door closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4089.jpg" +"4090" "Is the door open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4090.jpg" +"4091" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4091.jpg" +"4092" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4092.jpg" +"4093" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4093.jpg" +"4094" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4094.jpg" +"4095" "Is the wall pink in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4095.jpg" +"4096" "Is the wall green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4096.jpg" +"4097" "Is the floor pink in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4097.jpg" +"4098" "Is the floor black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4098.jpg" +"4099" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4099.jpg" +"4100" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4100.jpg" +"4101" "Does the zebra stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4101.jpg" +"4102" "Does the zebra sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4102.jpg" +"4103" "Is there one antelope in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4103.jpg" +"4104" "Are there two antelopes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4104.jpg" +"4105" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4105.jpg" +"4106" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4106.jpg" +"4107" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4107.jpg" +"4108" "Is the forest red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4108.jpg" +"4109" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4109.jpg" +"4110" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4110.jpg" +"4111" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4111.jpg" +"4112" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4112.jpg" +"4113" "Does the woman horseback riding in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4113.jpg" +"4114" "Does the woman walk in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4114.jpg" +"4115" "Is there one phone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4115.jpg" +"4116" "Are there two phones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4116.jpg" +"4117" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4117.jpg" +"4118" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4118.jpg" +"4119" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4119.jpg" +"4120" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4120.jpg" +"4121" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4121.jpg" +"4122" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4122.jpg" +"4123" "Is the sea turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4123.jpg" +"4124" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4124.jpg" +"4125" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4125.jpg" +"4126" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4126.jpg" +"4127" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4127.jpg" +"4128" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4128.jpg" +"4129" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4129.jpg" +"4130" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4130.jpg" +"4131" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4131.jpg" +"4132" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4132.jpg" +"4133" "Are there two birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4133.jpg" +"4134" "Are there three birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4134.jpg" +"4135" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4135.jpg" +"4136" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4136.jpg" +"4137" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4137.jpg" +"4138" "Are there two keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4138.jpg" +"4139" "Is there one controller in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4139.jpg" +"4140" "Are there six controllers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4140.jpg" +"4141" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4141.jpg" +"4142" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4142.jpg" +"4143" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4143.jpg" +"4144" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4144.jpg" +"4145" "Are there two urinals in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4145.jpg" +"4146" "Are there four urinals in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4146.jpg" +"4147" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4147.jpg" +"4148" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4148.jpg" +"4149" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4149.jpg" +"4150" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4150.jpg" +"4151" "Is there one water in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4151.jpg" +"4152" "Are there two waters in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4152.jpg" +"4153" "Is the bread delicious in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4153.jpg" +"4154" "Is the bread unappetizing in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4154.jpg" +"4155" "Is the chair black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4155.jpg" +"4156" "Is the chair white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4156.jpg" +"4157" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4157.jpg" +"4158" "Is the wall red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4158.jpg" +"4159" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4159.jpg" +"4160" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4160.jpg" +"4161" "Is the cup full in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4161.jpg" +"4162" "Is the cup empty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4162.jpg" +"4163" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4163.jpg" +"4164" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4164.jpg" +"4165" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4165.jpg" +"4166" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4166.jpg" +"4167" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4167.jpg" +"4168" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4168.jpg" +"4169" "Is the road curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4169.jpg" +"4170" "Is the road straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4170.jpg" +"4171" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4171.jpg" +"4172" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4172.jpg" +"4173" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4173.jpg" +"4174" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4174.jpg" +"4175" "Are there three apples in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4175.jpg" +"4176" "Are there five apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4176.jpg" +"4177" "Is there one tape in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4177.jpg" +"4178" "Are there two tapes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4178.jpg" +"4179" "Are there two computers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4179.jpg" +"4180" "Are there three computers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4180.jpg" +"4181" "Does the table tidy in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4181.jpg" +"4182" "Does the table messy in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4182.jpg" +"4183" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4183.jpg" +"4184" "Are there two keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4184.jpg" +"4185" "Is the mouse white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4185.jpg" +"4186" "Is the mouse black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4186.jpg" +"4187" "Is the sound white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4187.jpg" +"4188" "Is the sound pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4188.jpg" +"4189" "Is the chair comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4189.jpg" +"4190" "Is the chair uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4190.jpg" +"4191" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4191.jpg" +"4192" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4192.jpg" +"4193" "Is the floor dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4193.jpg" +"4194" "Is the floor clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4194.jpg" +"4195" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4195.jpg" +"4196" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4196.jpg" +"4197" "Is there one bin in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4197.jpg" +"4198" "Are there two bins in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4198.jpg" +"4199" "Is the lounge white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4199.jpg" +"4200" "Is the lounge black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4200.jpg" +"4201" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4201.jpg" +"4202" "Does the person jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4202.jpg" +"4203" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4203.jpg" +"4204" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4204.jpg" +"4205" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4205.jpg" +"4206" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4206.jpg" +"4207" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4207.jpg" +"4208" "Are there two toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4208.jpg" +"4209" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4209.jpg" +"4210" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4210.jpg" +"4211" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4211.jpg" +"4212" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4212.jpg" +"4213" "Is the tussock green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4213.jpg" +"4214" "Is the tussock yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4214.jpg" +"4215" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4215.jpg" +"4216" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4216.jpg" +"4217" "Is the train long in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4217.jpg" +"4218" "Is the train short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4218.jpg" +"4219" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4219.jpg" +"4220" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4220.jpg" +"4221" "Is the wall rough in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4221.jpg" +"4222" "Is the wall smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4222.jpg" +"4223" "Is there one bottle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4223.jpg" +"4224" "Are there two bottles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4224.jpg" +"4225" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4225.jpg" +"4226" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4226.jpg" +"4227" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4227.jpg" +"4228" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4228.jpg" +"4229" "Is there one sunglasses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4229.jpg" +"4230" "Are there three sunglass in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4230.jpg" +"4231" "Is the camera black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4231.jpg" +"4232" "Is the camera blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4232.jpg" +"4233" "Does the person get in the water in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4233.jpg" +"4234" "Does the person come ashore in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4234.jpg" +"4235" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4235.jpg" +"4236" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4236.jpg" +"4237" "Is the sea rolling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4237.jpg" +"4238" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4238.jpg" +"4239" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4239.jpg" +"4240" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4240.jpg" +"4241" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4241.jpg" +"4242" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4242.jpg" +"4243" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4243.jpg" +"4244" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4244.jpg" +"4245" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4245.jpg" +"4246" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4246.jpg" +"4247" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4247.jpg" +"4248" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4248.jpg" +"4249" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4249.jpg" +"4250" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4250.jpg" +"4251" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4251.jpg" +"4252" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4252.jpg" +"4253" "Are there two lounges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4253.jpg" +"4254" "Are there three lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4254.jpg" +"4255" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4255.jpg" +"4256" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4256.jpg" +"4257" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4257.jpg" +"4258" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4258.jpg" +"4259" "Is the sea vast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4259.jpg" +"4260" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4260.jpg" +"4261" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4261.jpg" +"4262" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4262.jpg" +"4263" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4263.jpg" +"4264" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4264.jpg" +"4265" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4265.jpg" +"4266" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4266.jpg" +"4267" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4267.jpg" +"4268" "Does the cat jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4268.jpg" +"4269" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4269.jpg" +"4270" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4270.jpg" +"4271" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4271.jpg" +"4272" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4272.jpg" +"4273" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4273.jpg" +"4274" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4274.jpg" +"4275" "Is the manhole round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4275.jpg" +"4276" "Is the manhole square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4276.jpg" +"4277" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4277.jpg" +"4278" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4278.jpg" +"4279" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4279.jpg" +"4280" "Are there two keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4280.jpg" +"4281" "Is the flower vibrant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4281.jpg" +"4282" "Is the flower understated in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4282.jpg" +"4283" "Is the fence red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4283.jpg" +"4284" "Is the fence white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4284.jpg" +"4285" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4285.jpg" +"4286" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4286.jpg" +"4287" "Is there one kettle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4287.jpg" +"4288" "Are there two kettles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4288.jpg" +"4289" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4289.jpg" +"4290" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4290.jpg" +"4291" "Does the cat stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4291.jpg" +"4292" "Does the cat sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4292.jpg" +"4293" "Is there one electrombile in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4293.jpg" +"4294" "Are there two electrombiles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4294.jpg" +"4295" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4295.jpg" +"4296" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4296.jpg" +"4297" "Is the house old in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4297.jpg" +"4298" "Is the house new in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4298.jpg" +"4299" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4299.jpg" +"4300" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4300.jpg" +"4301" "Is there one orange in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4301.jpg" +"4302" "Are there two oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4302.jpg" +"4303" "Is the laptop closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4303.jpg" +"4304" "Is the laptop open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4304.jpg" +"4305" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4305.jpg" +"4306" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4306.jpg" +"4307" "Are there five sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4307.jpg" +"4308" "Are there eight sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4308.jpg" +"4309" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4309.jpg" +"4310" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4310.jpg" +"4311" "Is there one light in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4311.jpg" +"4312" "Are there two lights in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4312.jpg" +"4313" "Is the tap open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4313.jpg" +"4314" "Is the tap closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4314.jpg" +"4315" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4315.jpg" +"4316" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4316.jpg" +"4317" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4317.jpg" +"4318" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4318.jpg" +"4319" "Is the streetlamp closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4319.jpg" +"4320" "Is the streetlamp open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4320.jpg" +"4321" "Is the streetlamp straight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4321.jpg" +"4322" "Is the streetlamp curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4322.jpg" +"4323" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4323.jpg" +"4324" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4324.jpg" +"4325" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4325.jpg" +"4326" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4326.jpg" +"4327" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4327.jpg" +"4328" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4328.jpg" +"4329" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4329.jpg" +"4330" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4330.jpg" +"4331" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4331.jpg" +"4332" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4332.jpg" +"4333" "Does the cat raise in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4333.jpg" +"4334" "Does the cat lower in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4334.jpg" +"4335" "Is there one brush in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4335.jpg" +"4336" "Are there two brushes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4336.jpg" +"4337" "Is the fence short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4337.jpg" +"4338" "Is the fence tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4338.jpg" +"4339" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4339.jpg" +"4340" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4340.jpg" +"4341" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4341.jpg" +"4342" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4342.jpg" +"4343" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4343.jpg" +"4344" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4344.jpg" +"4345" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4345.jpg" +"4346" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4346.jpg" +"4347" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4347.jpg" +"4348" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4348.jpg" +"4349" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4349.jpg" +"4350" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4350.jpg" +"4351" "Does the pigeon stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4351.jpg" +"4352" "Does the pigeon fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4352.jpg" +"4353" "Is there one telescope in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4353.jpg" +"4354" "Are there three telescopes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4354.jpg" +"4355" "Is the forest lush and verdant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4355.jpg" +"4356" "Is the forest falling yellow leaves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4356.jpg" +"4357" "Does the motorbike park in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4357.jpg" +"4358" "Does the motorbike drive in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4358.jpg" +"4359" "Are there two houses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4359.jpg" +"4360" "Are there six houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4360.jpg" +"4361" "Is the ground black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4361.jpg" +"4362" "Is the ground white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4362.jpg" +"4363" "Is there one cone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4363.jpg" +"4364" "Are there three cones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4364.jpg" +"4365" "Does the bus park in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4365.jpg" +"4366" "Does the bus drive in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4366.jpg" +"4367" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4367.jpg" +"4368" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4368.jpg" +"4369" "Is the floor patterned in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4369.jpg" +"4370" "Is the floor solid color in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4370.jpg" +"4371" "Does the person lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4371.jpg" +"4372" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4372.jpg" +"4373" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4373.jpg" +"4374" "Are there three toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4374.jpg" +"4375" "Is the bin silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4375.jpg" +"4376" "Is the bin blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4376.jpg" +"4377" "Is there one light in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4377.jpg" +"4378" "Are there three lights in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4378.jpg" +"4379" "Is the mirror irregular in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4379.jpg" +"4380" "Is the mirror round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4380.jpg" +"4381" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4381.jpg" +"4382" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4382.jpg" +"4383" "Is the plate round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4383.jpg" +"4384" "Is the plate square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4384.jpg" +"4385" "Is the pizza yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4385.jpg" +"4386" "Is the pizza red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4386.jpg" +"4387" "Is the cup white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4387.jpg" +"4388" "Is the cup black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4388.jpg" +"4389" "Does the person walking in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4389.jpg" +"4390" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4390.jpg" +"4391" "Is there one giraffe in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4391.jpg" +"4392" "Are there three giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4392.jpg" +"4393" "Is the forest rare in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4393.jpg" +"4394" "Is the forest dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4394.jpg" +"4395" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4395.jpg" +"4396" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4396.jpg" +"4397" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4397.jpg" +"4398" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4398.jpg" +"4399" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4399.jpg" +"4400" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4400.jpg" +"4401" "Is the apple 2 in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4401.jpg" +"4402" "Is the apple 5 in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4402.jpg" +"4403" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4403.jpg" +"4404" "Are there three knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4404.jpg" +"4405" "Is the table natural wood color in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4405.jpg" +"4406" "Is the table black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4406.jpg" +"4407" "Are there eight hots in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4407.jpg" +"4408" "Are there nine hots in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4408.jpg" +"4409" "Is there one grill in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4409.jpg" +"4410" "Are there three grills in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4410.jpg" +"4411" "Is the charcoal gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4411.jpg" +"4412" "Is the charcoal black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4412.jpg" +"4413" "Is the grass emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4413.jpg" +"4414" "Is the grass yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4414.jpg" +"4415" "Does the pigeon stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4415.jpg" +"4416" "Does the pigeon fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4416.jpg" +"4417" "Is the tree dead branches in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4417.jpg" +"4418" "Is the tree lush green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4418.jpg" +"4419" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4419.jpg" +"4420" "Is the sky pure white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4420.jpg" +"4421" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4421.jpg" +"4422" "Is the wall yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4422.jpg" +"4423" "Does the laptop open in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4423.jpg" +"4424" "Does the laptop close in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4424.jpg" +"4425" "Does the computer close in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4425.jpg" +"4426" "Does the computer open in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4426.jpg" +"4427" "Are there two wineglasses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4427.jpg" +"4428" "Are there three wineglasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4428.jpg" +"4429" "Is there one wine in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4429.jpg" +"4430" "Are there four wines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4430.jpg" +"4431" "Does the laptop open in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4431.jpg" +"4432" "Does the laptop close in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4432.jpg" +"4433" "Does the boy strike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4433.jpg" +"4434" "Does the boy sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4434.jpg" +"4435" "Is there one bat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4435.jpg" +"4436" "Are there three bats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4436.jpg" +"4437" "Is the ball fluorescent green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4437.jpg" +"4438" "Is the ball red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4438.jpg" +"4439" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4439.jpg" +"4440" "Does the man lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4440.jpg" +"4441" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4441.jpg" +"4442" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4442.jpg" +"4443" "Is the woman kick in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4443.jpg" +"4444" "Is the woman sit in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4444.jpg" +"4445" "Is the man stand in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4445.jpg" +"4446" "Is the man lie down in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4446.jpg" +"4447" "Is there one ball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4447.jpg" +"4448" "Are there three balls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4448.jpg" +"4449" "Is the flag yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4449.jpg" +"4450" "Is the flag red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4450.jpg" +"4451" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4451.jpg" +"4452" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4452.jpg" +"4453" "Does the electrombile park in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4453.jpg" +"4454" "Does the electrombile drive in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4454.jpg" +"4455" "Is the dog sit in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4455.jpg" +"4456" "Is the dog lie down in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4456.jpg" +"4457" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4457.jpg" +"4458" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4458.jpg" +"4459" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4459.jpg" +"4460" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4460.jpg" +"4461" "Is there one cake in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4461.jpg" +"4462" "Are there three cakes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4462.jpg" +"4463" "Is the fork silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4463.jpg" +"4464" "Is the fork blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4464.jpg" +"4465" "Is the plate round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4465.jpg" +"4466" "Is the plate square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4466.jpg" +"4467" "Is the table gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4467.jpg" +"4468" "Is the table black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4468.jpg" +"4469" "Are there five doughnuts in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4469.jpg" +"4470" "Are there six doughnuts in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4470.jpg" +"4471" "Is there one box in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4471.jpg" +"4472" "Are there three boxes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4472.jpg" +"4473" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4473.jpg" +"4474" "Are there three cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4474.jpg" +"4475" "Is the grass emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4475.jpg" +"4476" "Is the grass yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4476.jpg" +"4477" "Is the tree sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4477.jpg" +"4478" "Is the tree dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4478.jpg" +"4479" "Does the dog jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4479.jpg" +"4480" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4480.jpg" +"4481" "Is the toy red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4481.jpg" +"4482" "Is the toy yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4482.jpg" +"4483" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4483.jpg" +"4484" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4484.jpg" +"4485" "Does the boy crouch in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4485.jpg" +"4486" "Does the boy sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4486.jpg" +"4487" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4487.jpg" +"4488" "Are there three toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4488.jpg" +"4489" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4489.jpg" +"4490" "Is the sun gentle in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4490.jpg" +"4491" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4491.jpg" +"4492" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4492.jpg" +"4493" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4493.jpg" +"4494" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4494.jpg" +"4495" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4495.jpg" +"4496" "Is the snow gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4496.jpg" +"4497" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4497.jpg" +"4498" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4498.jpg" +"4499" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4499.jpg" +"4500" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4500.jpg" +"4501" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4501.jpg" +"4502" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4502.jpg" +"4503" "Is there one sign in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4503.jpg" +"4504" "Are there four signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4504.jpg" +"4505" "Is the tree sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4505.jpg" +"4506" "Is the tree dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4506.jpg" +"4507" "Is the cloud pure white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4507.jpg" +"4508" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4508.jpg" +"4509" "Are there two buses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4509.jpg" +"4510" "Are there six buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4510.jpg" +"4511" "Is the house yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4511.jpg" +"4512" "Is the house white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4512.jpg" +"4513" "Is the tree falling leaves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4513.jpg" +"4514" "Is the tree lush branches in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4514.jpg" +"4515" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4515.jpg" +"4516" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4516.jpg" +"4517" "Is the tree dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4517.jpg" +"4518" "Is the tree rare in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4518.jpg" +"4519" "Is the snow pristine in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4519.jpg" +"4520" "Is the snow filthy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4520.jpg" +"4521" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4521.jpg" +"4522" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4522.jpg" +"4523" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4523.jpg" +"4524" "Are there five hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4524.jpg" +"4525" "Does the bicycle park in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4525.jpg" +"4526" "Does the bicycle drive in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4526.jpg" +"4527" "Is the wall yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4527.jpg" +"4528" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4528.jpg" +"4529" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4529.jpg" +"4530" "Does the cat lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4530.jpg" +"4531" "Are there two luggages in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4531.jpg" +"4532" "Are there six luggages in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4532.jpg" +"4533" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4533.jpg" +"4534" "Is the wall gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4534.jpg" +"4535" "Is the floor wooden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4535.jpg" +"4536" "Is the floor tiled in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4536.jpg" +"4537" "Does the man half-squat in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4537.jpg" +"4538" "Does the man lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4538.jpg" +"4539" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4539.jpg" +"4540" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4540.jpg" +"4541" "Are there two buses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4541.jpg" +"4542" "Are there five buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4542.jpg" +"4543" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4543.jpg" +"4544" "Are there six people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4544.jpg" +"4545" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4545.jpg" +"4546" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4546.jpg" +"4547" "Is the forest sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4547.jpg" +"4548" "Is the forest dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4548.jpg" +"4549" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4549.jpg" +"4550" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4550.jpg" +"4551" "Is the grass emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4551.jpg" +"4552" "Is the grass yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4552.jpg" +"4553" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4553.jpg" +"4554" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4554.jpg" +"4555" "Does the person paddle in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4555.jpg" +"4556" "Does the person lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4556.jpg" +"4557" "Is the ship yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4557.jpg" +"4558" "Is the ship green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4558.jpg" +"4559" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4559.jpg" +"4560" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4560.jpg" +"4561" "Is the forest verdant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4561.jpg" +"4562" "Is the forest yellowing leaves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4562.jpg" +"4563" "Is the refrigerator white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4563.jpg" +"4564" "Is the refrigerator gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4564.jpg" +"4565" "Is there one microwave in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4565.jpg" +"4566" "Are there three microwaves in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4566.jpg" +"4567" "Is the socket white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4567.jpg" +"4568" "Is the socket yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4568.jpg" +"4569" "Is the wall tiled in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4569.jpg" +"4570" "Is the wall latex painted in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4570.jpg" +"4571" "Is there one bag in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4571.jpg" +"4572" "Are there three bags in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4572.jpg" +"4573" "Is the bag black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4573.jpg" +"4574" "Is the bag white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4574.jpg" +"4575" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4575.jpg" +"4576" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4576.jpg" +"4577" "Is the tomato red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4577.jpg" +"4578" "Is the tomato green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4578.jpg" +"4579" "Are there three carrots in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4579.jpg" +"4580" "Are there six carrots in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4580.jpg" +"4581" "Is the broccoli green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4581.jpg" +"4582" "Is the broccoli yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4582.jpg" +"4583" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4583.jpg" +"4584" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4584.jpg" +"4585" "Is the wall red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4585.jpg" +"4586" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4586.jpg" +"4587" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4587.jpg" +"4588" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4588.jpg" +"4589" "Is the sign inclined in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4589.jpg" +"4590" "Is the sign straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4590.jpg" +"4591" "Is the tree sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4591.jpg" +"4592" "Is the tree dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4592.jpg" +"4593" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4593.jpg" +"4594" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4594.jpg" +"4595" "Is the cloud pure white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4595.jpg" +"4596" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4596.jpg" +"4597" "Are there three books in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4597.jpg" +"4598" "Are there four books in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4598.jpg" +"4599" "Does the laptop open in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4599.jpg" +"4600" "Does the laptop close in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4600.jpg" +"4601" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4601.jpg" +"4602" "Is the keyboard black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4602.jpg" +"4603" "Is the mouse white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4603.jpg" +"4604" "Is the mouse pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4604.jpg" +"4605" "Is the wall solid color in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4605.jpg" +"4606" "Is the wall patterned in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4606.jpg" +"4607" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4607.jpg" +"4608" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4608.jpg" +"4609" "Is the horse white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4609.jpg" +"4610" "Is the horse black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4610.jpg" +"4611" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4611.jpg" +"4612" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4612.jpg" +"4613" "Is there one bed in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4613.jpg" +"4614" "Are there three beds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4614.jpg" +"4615" "Is there one quilt in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4615.jpg" +"4616" "Are there three quilts in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4616.jpg" +"4617" "Are there two pillows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4617.jpg" +"4618" "Are there five pillows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4618.jpg" +"4619" "Is the wall yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4619.jpg" +"4620" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4620.jpg" +"4621" "Is there one drawing in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4621.jpg" +"4622" "Are there four drawings in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4622.jpg" +"4623" "Is the apple red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4623.jpg" +"4624" "Is the apple green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4624.jpg" +"4625" "Is the orange yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4625.jpg" +"4626" "Is the orange green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4626.jpg" +"4627" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4627.jpg" +"4628" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4628.jpg" +"4629" "Is the ground muddy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4629.jpg" +"4630" "Is the ground concrete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4630.jpg" +"4631" "Are there three bananas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4631.jpg" +"4632" "Are there six bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4632.jpg" +"4633" "Are there two apples in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4633.jpg" +"4634" "Are there six apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4634.jpg" +"4635" "Is the plate round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4635.jpg" +"4636" "Is the plate square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4636.jpg" +"4637" "Are there two beds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4637.jpg" +"4638" "Are there three beds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4638.jpg" +"4639" "Are there two quilts in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4639.jpg" +"4640" "Are there four quilts in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4640.jpg" +"4641" "Is the wall striped in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4641.jpg" +"4642" "Is the wall solid color in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4642.jpg" +"4643" "Are there two lamps in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4643.jpg" +"4644" "Are there five lamps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4644.jpg" +"4645" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4645.jpg" +"4646" "Is the sun gentle in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4646.jpg" +"4647" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4647.jpg" +"4648" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4648.jpg" +"4649" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4649.jpg" +"4650" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4650.jpg" +"4651" "Is the snow pristine in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4651.jpg" +"4652" "Is the snow filthy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4652.jpg" +"4653" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4653.jpg" +"4654" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4654.jpg" +"4655" "Does the person slide in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4655.jpg" +"4656" "Does the person lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4656.jpg" +"4657" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4657.jpg" +"4658" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4658.jpg" +"4659" "Is the cloud pure white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4659.jpg" +"4660" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4660.jpg" +"4661" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4661.jpg" +"4662" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4662.jpg" +"4663" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4663.jpg" +"4664" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4664.jpg" +"4665" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4665.jpg" +"4666" "Is the grass rare in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4666.jpg" +"4667" "Is the train red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4667.jpg" +"4668" "Is the train white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4668.jpg" +"4669" "Is the sky overcast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4669.jpg" +"4670" "Is the sky sunny in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4670.jpg" +"4671" "Is the tree dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4671.jpg" +"4672" "Is the tree sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4672.jpg" +"4673" "Are there two boards in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4673.jpg" +"4674" "Are there six boards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4674.jpg" +"4675" "Does the train driving in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4675.jpg" +"4676" "Does the train stopped in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4676.jpg" +"4677" "Is the rail straight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4677.jpg" +"4678" "Is the rail curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4678.jpg" +"4679" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4679.jpg" +"4680" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4680.jpg" +"4681" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4681.jpg" +"4682" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4682.jpg" +"4683" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4683.jpg" +"4684" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4684.jpg" +"4685" "Are there two baggages in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4685.jpg" +"4686" "Are there five baggages in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4686.jpg" +"4687" "Is the floor tiled in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4687.jpg" +"4688" "Is the floor wooden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4688.jpg" +"4689" "Is there one cone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4689.jpg" +"4690" "Are there three cones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4690.jpg" +"4691" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4691.jpg" +"4692" "Are there five hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4692.jpg" +"4693" "Is the ground concrete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4693.jpg" +"4694" "Is the ground muddy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4694.jpg" +"4695" "Are there two zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4695.jpg" +"4696" "Are there six zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4696.jpg" +"4697" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4697.jpg" +"4698" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4698.jpg" +"4699" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4699.jpg" +"4700" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4700.jpg" +"4701" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4701.jpg" +"4702" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4702.jpg" +"4703" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4703.jpg" +"4704" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4704.jpg" +"4705" "Is the cherry red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4705.jpg" +"4706" "Is the cherry white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4706.jpg" +"4707" "Are there three oranges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4707.jpg" +"4708" "Are there six oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4708.jpg" +"4709" "Is the basin red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4709.jpg" +"4710" "Is the basin white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4710.jpg" +"4711" "Is the tree dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4711.jpg" +"4712" "Is the tree sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4712.jpg" +"4713" "Is the leave golden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4713.jpg" +"4714" "Is the leave black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4714.jpg" +"4715" "Is the ground dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4715.jpg" +"4716" "Is the ground clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4716.jpg" +"4717" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4717.jpg" +"4718" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4718.jpg" +"4719" "Is the streetlamp closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4719.jpg" +"4720" "Is the streetlamp open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4720.jpg" +"4721" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4721.jpg" +"4722" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4722.jpg" +"4723" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4723.jpg" +"4724" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4724.jpg" +"4725" "Is the rice white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4725.jpg" +"4726" "Is the rice black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4726.jpg" +"4727" "Is the broccoli green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4727.jpg" +"4728" "Is the broccoli pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4728.jpg" +"4729" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4729.jpg" +"4730" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4730.jpg" +"4731" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4731.jpg" +"4732" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4732.jpg" +"4733" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4733.jpg" +"4734" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4734.jpg" +"4735" "Are there four buses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4735.jpg" +"4736" "Are there five buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4736.jpg" +"4737" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4737.jpg" +"4738" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4738.jpg" +"4739" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4739.jpg" +"4740" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4740.jpg" +"4741" "Are there two buses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4741.jpg" +"4742" "Are there four buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4742.jpg" +"4743" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4743.jpg" +"4744" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4744.jpg" +"4745" "Is the road curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4745.jpg" +"4746" "Is the road straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4746.jpg" +"4747" "Is the sofa red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4747.jpg" +"4748" "Is the sofa white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4748.jpg" +"4749" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4749.jpg" +"4750" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4750.jpg" +"4751" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4751.jpg" +"4752" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4752.jpg" +"4753" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4753.jpg" +"4754" "Is the wall red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4754.jpg" +"4755" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4755.jpg" +"4756" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4756.jpg" +"4757" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4757.jpg" +"4758" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4758.jpg" +"4759" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4759.jpg" +"4760" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4760.jpg" +"4761" "Is the sea deep blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4761.jpg" +"4762" "Is the sea black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4762.jpg" +"4763" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4763.jpg" +"4764" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4764.jpg" +"4765" "Are there three tangerines in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4765.jpg" +"4766" "Are there four tangerines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4766.jpg" +"4767" "Are there two pears in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4767.jpg" +"4768" "Are there five pears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4768.jpg" +"4769" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4769.jpg" +"4770" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4770.jpg" +"4771" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4771.jpg" +"4772" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4772.jpg" +"4773" "Does the giraffe lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4773.jpg" +"4774" "Does the giraffe stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4774.jpg" +"4775" "Is the bush green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4775.jpg" +"4776" "Is the bush red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4776.jpg" +"4777" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4777.jpg" +"4778" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4778.jpg" +"4779" "Are there two sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4779.jpg" +"4780" "Are there three sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4780.jpg" +"4781" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4781.jpg" +"4782" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4782.jpg" +"4783" "Is the bus white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4783.jpg" +"4784" "Is the bus black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4784.jpg" +"4785" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4785.jpg" +"4786" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4786.jpg" +"4787" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4787.jpg" +"4788" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4788.jpg" +"4789" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4789.jpg" +"4790" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4790.jpg" +"4791" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4791.jpg" +"4792" "Are there eight people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4792.jpg" +"4793" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4793.jpg" +"4794" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4794.jpg" +"4795" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4795.jpg" +"4796" "Is the wall pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4796.jpg" +"4797" "Is the sofa red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4797.jpg" +"4798" "Is the sofa gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4798.jpg" +"4799" "Does the woman sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4799.jpg" +"4800" "Does the woman stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4800.jpg" +"4801" "Is the shoe black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4801.jpg" +"4802" "Is the shoe yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4802.jpg" +"4803" "Is the laptop white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4803.jpg" +"4804" "Is the laptop gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4804.jpg" +"4805" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4805.jpg" +"4806" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4806.jpg" +"4807" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4807.jpg" +"4808" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4808.jpg" +"4809" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4809.jpg" +"4810" "Are there eight people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4810.jpg" +"4811" "Is the laptop silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4811.jpg" +"4812" "Is the laptop black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4812.jpg" +"4813" "Are there two phones in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4813.jpg" +"4814" "Are there five phones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4814.jpg" +"4815" "Are there four chairs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4815.jpg" +"4816" "Are there five chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4816.jpg" +"4817" "Is the pad closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4817.jpg" +"4818" "Is the pad started in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4818.jpg" +"4819" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4819.jpg" +"4820" "Is the keyboard black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4820.jpg" +"4821" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4821.jpg" +"4822" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4822.jpg" +"4823" "Are there two breads in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4823.jpg" +"4824" "Are there four breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4824.jpg" +"4825" "Does the tree green in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4825.jpg" +"4826" "Does the tree yellow in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4826.jpg" +"4827" "Is the signal open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4827.jpg" +"4828" "Is the signal closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4828.jpg" +"4829" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4829.jpg" +"4830" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4830.jpg" +"4831" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4831.jpg" +"4832" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4832.jpg" +"4833" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4833.jpg" +"4834" "Is the tree gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4834.jpg" +"4835" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4835.jpg" +"4836" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4836.jpg" +"4837" "Is the signal open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4837.jpg" +"4838" "Is the signal closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4838.jpg" +"4839" "Is the sign square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4839.jpg" +"4840" "Is the sign round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4840.jpg" +"4841" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4841.jpg" +"4842" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4842.jpg" +"4843" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4843.jpg" +"4844" "Is the tree wither in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4844.jpg" +"4845" "Does the man squat in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4845.jpg" +"4846" "Does the man upright in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4846.jpg" +"4847" "Is the frisbee yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4847.jpg" +"4848" "Is the frisbee black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4848.jpg" +"4849" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4849.jpg" +"4850" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4850.jpg" +"4851" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4851.jpg" +"4852" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4852.jpg" +"4853" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4853.jpg" +"4854" "Is the forest yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4854.jpg" +"4855" "Are there five birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4855.jpg" +"4856" "Are there six birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4856.jpg" +"4857" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4857.jpg" +"4858" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4858.jpg" +"4859" "Is the tree red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4859.jpg" +"4860" "Is the tree green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4860.jpg" +"4861" "Is there one sign in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4861.jpg" +"4862" "Are there two signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4862.jpg" +"4863" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4863.jpg" +"4864" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4864.jpg" +"4865" "Is the light open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4865.jpg" +"4866" "Is the light close in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4866.jpg" +"4867" "Is the mirror square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4867.jpg" +"4868" "Is the mirror round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4868.jpg" +"4869" "Is the tap close in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4869.jpg" +"4870" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4870.jpg" +"4871" "Is there one sink in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4871.jpg" +"4872" "Are there two sinks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4872.jpg" +"4873" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4873.jpg" +"4874" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4874.jpg" +"4875" "Is the knife silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4875.jpg" +"4876" "Is the knife black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4876.jpg" +"4877" "Are there two forks in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4877.jpg" +"4878" "Are there three forks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4878.jpg" +"4879" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4879.jpg" +"4880" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4880.jpg" +"4881" "Is the pizza picturesque in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4881.jpg" +"4882" "Is the pizza plain-looking in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4882.jpg" +"4883" "Is the plate square in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4883.jpg" +"4884" "Is the plate round in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4884.jpg" +"4885" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4885.jpg" +"4886" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4886.jpg" +"4887" "Does the child kick in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4887.jpg" +"4888" "Does the child lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4888.jpg" +"4889" "Is there one ball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4889.jpg" +"4890" "Are there three balls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4890.jpg" +"4891" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4891.jpg" +"4892" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4892.jpg" +"4893" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4893.jpg" +"4894" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4894.jpg" +"4895" "Is the lake calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4895.jpg" +"4896" "Is the lake stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4896.jpg" +"4897" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4897.jpg" +"4898" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4898.jpg" +"4899" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4899.jpg" +"4900" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4900.jpg" +"4901" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4901.jpg" +"4902" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4902.jpg" +"4903" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4903.jpg" +"4904" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4904.jpg" +"4905" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4905.jpg" +"4906" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4906.jpg" +"4907" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4907.jpg" +"4908" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4908.jpg" +"4909" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4909.jpg" +"4910" "Is the sea turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4910.jpg" +"4911" "Is the train driving in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4911.jpg" +"4912" "Is the train stopped in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4912.jpg" +"4913" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4913.jpg" +"4914" "Is the forest yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4914.jpg" +"4915" "Does the person drive in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4915.jpg" +"4916" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4916.jpg" +"4917" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4917.jpg" +"4918" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4918.jpg" +"4919" "Are there two women in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4919.jpg" +"4920" "Are there seven women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4920.jpg" +"4921" "Does the laptop open in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4921.jpg" +"4922" "Does the laptop closed in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4922.jpg" +"4923" "Are there two coffees in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4923.jpg" +"4924" "Are there five coffees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4924.jpg" +"4925" "Is the scoon silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4925.jpg" +"4926" "Is the scoon yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4926.jpg" +"4927" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4927.jpg" +"4928" "Are there six bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4928.jpg" +"4929" "Does the giraffe stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4929.jpg" +"4930" "Does the giraffe lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4930.jpg" +"4931" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4931.jpg" +"4932" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4932.jpg" +"4933" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4933.jpg" +"4934" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4934.jpg" +"4935" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4935.jpg" +"4936" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4936.jpg" +"4937" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4937.jpg" +"4938" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4938.jpg" +"4939" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4939.jpg" +"4940" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4940.jpg" +"4941" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4941.jpg" +"4942" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4942.jpg" +"4943" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4943.jpg" +"4944" "Does the child run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4944.jpg" +"4945" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4945.jpg" +"4946" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4946.jpg" +"4947" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4947.jpg" +"4948" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4948.jpg" +"4949" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4949.jpg" +"4950" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4950.jpg" +"4951" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4951.jpg" +"4952" "Are there five people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4952.jpg" +"4953" "Does the child surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4953.jpg" +"4954" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4954.jpg" +"4955" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4955.jpg" +"4956" "Are there three surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4956.jpg" +"4957" "Is the sea restless in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4957.jpg" +"4958" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4958.jpg" +"4959" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4959.jpg" +"4960" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4960.jpg" +"4961" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4961.jpg" +"4962" "Are there three knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4962.jpg" +"4963" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4963.jpg" +"4964" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4964.jpg" +"4965" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4965.jpg" +"4966" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4966.jpg" +"4967" "Is the sea turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4967.jpg" +"4968" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4968.jpg" +"4969" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4969.jpg" +"4970" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4970.jpg" +"4971" "Does the dog lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4971.jpg" +"4972" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4972.jpg" +"4973" "Is there one doghole in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4973.jpg" +"4974" "Are there two dogholes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4974.jpg" +"4975" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4975.jpg" +"4976" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4976.jpg" +"4977" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4977.jpg" +"4978" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4978.jpg" +"4979" "Are there five breads in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4979.jpg" +"4980" "Are there eight breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4980.jpg" +"4981" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4981.jpg" +"4982" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4982.jpg" +"4983" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4983.jpg" +"4984" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4984.jpg" +"4985" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4985.jpg" +"4986" "Are there three cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4986.jpg" +"4987" "Does the horse stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4987.jpg" +"4988" "Does the horse sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4988.jpg" +"4989" "Is the road narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4989.jpg" +"4990" "Is the road wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4990.jpg" +"4991" "Is the fence short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4991.jpg" +"4992" "Is the fence tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4992.jpg" +"4993" "Is the forest withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4993.jpg" +"4994" "Is the forest lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4994.jpg" +"4995" "Is there one duck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4995.jpg" +"4996" "Are there two ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4996.jpg" +"4997" "Is the lake calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4997.jpg" +"4998" "Is the lake turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4998.jpg" +"4999" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/4999.jpg" +"5000" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5000.jpg" +"5001" "Is the sea calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5001.jpg" +"5002" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5002.jpg" +"5003" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5003.jpg" +"5004" "Is the wall yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5004.jpg" +"5005" "Is there one microwave in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5005.jpg" +"5006" "Are there two microwaves in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5006.jpg" +"5007" "Is there one pot in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5007.jpg" +"5008" "Are there three pots in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5008.jpg" +"5009" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5009.jpg" +"5010" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5010.jpg" +"5011" "Is there one house in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5011.jpg" +"5012" "Are there two houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5012.jpg" +"5013" "Are there three trees in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5013.jpg" +"5014" "Are there four trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5014.jpg" +"5015" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5015.jpg" +"5016" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5016.jpg" +"5017" "Is the flower fresh in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5017.jpg" +"5018" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5018.jpg" +"5019" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5019.jpg" +"5020" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5020.jpg" +"5021" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5021.jpg" +"5022" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5022.jpg" +"5023" "Is there one lamp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5023.jpg" +"5024" "Are there two lamps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5024.jpg" +"5025" "Does the cat sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5025.jpg" +"5026" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5026.jpg" +"5027" "Is the cable black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5027.jpg" +"5028" "Is the cable white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5028.jpg" +"5029" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5029.jpg" +"5030" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5030.jpg" +"5031" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5031.jpg" +"5032" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5032.jpg" +"5033" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5033.jpg" +"5034" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5034.jpg" +"5035" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5035.jpg" +"5036" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5036.jpg" +"5037" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5037.jpg" +"5038" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5038.jpg" +"5039" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5039.jpg" +"5040" "Are there three motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5040.jpg" +"5041" "Is the ground wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5041.jpg" +"5042" "Is the ground narrow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5042.jpg" +"5043" "Is the sign obvious in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5043.jpg" +"5044" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5044.jpg" +"5045" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5045.jpg" +"5046" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5046.jpg" +"5047" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5047.jpg" +"5048" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5048.jpg" +"5049" "Are there two cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5049.jpg" +"5050" "Are there three cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5050.jpg" +"5051" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5051.jpg" +"5052" "Are there five tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5052.jpg" +"5053" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5053.jpg" +"5054" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5054.jpg" +"5055" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5055.jpg" +"5056" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5056.jpg" +"5057" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5057.jpg" +"5058" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5058.jpg" +"5059" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5059.jpg" +"5060" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5060.jpg" +"5061" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5061.jpg" +"5062" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5062.jpg" +"5063" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5063.jpg" +"5064" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5064.jpg" +"5065" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5065.jpg" +"5066" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5066.jpg" +"5067" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5067.jpg" +"5068" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5068.jpg" +"5069" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5069.jpg" +"5070" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5070.jpg" +"5071" "Is the kite varied postures in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5071.jpg" +"5072" "Is the kite uniform in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5072.jpg" +"5073" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5073.jpg" +"5074" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5074.jpg" +"5075" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5075.jpg" +"5076" "Is the lake calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5076.jpg" +"5077" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5077.jpg" +"5078" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5078.jpg" +"5079" "Is the beach messy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5079.jpg" +"5080" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5080.jpg" +"5081" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5081.jpg" +"5082" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5082.jpg" +"5083" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5083.jpg" +"5084" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5084.jpg" +"5085" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5085.jpg" +"5086" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5086.jpg" +"5087" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5087.jpg" +"5088" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5088.jpg" +"5089" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5089.jpg" +"5090" "Is the sky yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5090.jpg" +"5091" "Is the mountain rugged mountains in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5091.jpg" +"5092" "Is the mountain flat as far as the eye can see in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5092.jpg" +"5093" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5093.jpg" +"5094" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5094.jpg" +"5095" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5095.jpg" +"5096" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5096.jpg" +"5097" "Does the elephant walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5097.jpg" +"5098" "Does the elephant run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5098.jpg" +"5099" "Are there two cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5099.jpg" +"5100" "Are there four cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5100.jpg" +"5101" "Is the ground smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5101.jpg" +"5102" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5102.jpg" +"5103" "Is the forest emerald in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5103.jpg" +"5104" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5104.jpg" +"5105" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5105.jpg" +"5106" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5106.jpg" +"5107" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5107.jpg" +"5108" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5108.jpg" +"5109" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5109.jpg" +"5110" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5110.jpg" +"5111" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5111.jpg" +"5112" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5112.jpg" +"5113" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5113.jpg" +"5114" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5114.jpg" +"5115" "Are there four people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5115.jpg" +"5116" "Are there six people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5116.jpg" +"5117" "Are there four horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5117.jpg" +"5118" "Are there six horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5118.jpg" +"5119" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5119.jpg" +"5120" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5120.jpg" +"5121" "Are there three birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5121.jpg" +"5122" "Are there five birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5122.jpg" +"5123" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5123.jpg" +"5124" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5124.jpg" +"5125" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5125.jpg" +"5126" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5126.jpg" +"5127" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5127.jpg" +"5128" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5128.jpg" +"5129" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5129.jpg" +"5130" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5130.jpg" +"5131" "Is the frisbee white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5131.jpg" +"5132" "Is the frisbee gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5132.jpg" +"5133" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5133.jpg" +"5134" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5134.jpg" +"5135" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5135.jpg" +"5136" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5136.jpg" +"5137" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5137.jpg" +"5138" "Is the forest yellowed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5138.jpg" +"5139" "Is the river gentle in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5139.jpg" +"5140" "Is the river rapid in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5140.jpg" +"5141" "Does the bear walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5141.jpg" +"5142" "Does the bear run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5142.jpg" +"5143" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5143.jpg" +"5144" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5144.jpg" +"5145" "Is the cloud gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5145.jpg" +"5146" "Is the cloud white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5146.jpg" +"5147" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5147.jpg" +"5148" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5148.jpg" +"5149" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5149.jpg" +"5150" "Is the sea calm in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5150.jpg" +"5151" "Is the toy yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5151.jpg" +"5152" "Is the toy blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5152.jpg" +"5153" "Is the ground smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5153.jpg" +"5154" "Is the ground uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5154.jpg" +"5155" "Does the dog lower in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5155.jpg" +"5156" "Does the dog raise in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5156.jpg" +"5157" "Is the skate black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5157.jpg" +"5158" "Is the skate white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5158.jpg" +"5159" "Is the toilet white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5159.jpg" +"5160" "Is the toilet black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5160.jpg" +"5161" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5161.jpg" +"5162" "Is the wall blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5162.jpg" +"5163" "Is the bin green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5163.jpg" +"5164" "Is the bin yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5164.jpg" +"5165" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5165.jpg" +"5166" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5166.jpg" +"5167" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5167.jpg" +"5168" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5168.jpg" +"5169" "Are there two kites in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5169.jpg" +"5170" "Are there four kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5170.jpg" +"5171" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5171.jpg" +"5172" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5172.jpg" +"5173" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5173.jpg" +"5174" "Does the cat run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5174.jpg" +"5175" "Is there one earphone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5175.jpg" +"5176" "Are there two earphones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5176.jpg" +"5177" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5177.jpg" +"5178" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5178.jpg" +"5179" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5179.jpg" +"5180" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5180.jpg" +"5181" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5181.jpg" +"5182" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5182.jpg" +"5183" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5183.jpg" +"5184" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5184.jpg" +"5185" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5185.jpg" +"5186" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5186.jpg" +"5187" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5187.jpg" +"5188" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5188.jpg" +"5189" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5189.jpg" +"5190" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5190.jpg" +"5191" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5191.jpg" +"5192" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5192.jpg" +"5193" "Does the person skiing in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5193.jpg" +"5194" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5194.jpg" +"5195" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5195.jpg" +"5196" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5196.jpg" +"5197" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5197.jpg" +"5198" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5198.jpg" +"5199" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5199.jpg" +"5200" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5200.jpg" +"5201" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5201.jpg" +"5202" "Is the plate green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5202.jpg" +"5203" "Is there one tangerine in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5203.jpg" +"5204" "Are there two tangerines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5204.jpg" +"5205" "Is there one orange in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5205.jpg" +"5206" "Are there three oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5206.jpg" +"5207" "Is the grape fresh in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5207.jpg" +"5208" "Is the grape decayed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5208.jpg" +"5209" "Is the grass lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5209.jpg" +"5210" "Is the grass in ruins in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5210.jpg" +"5211" "Are there two chickens in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5211.jpg" +"5212" "Are there three chickens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5212.jpg" +"5213" "Is the fence tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5213.jpg" +"5214" "Is the fence short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5214.jpg" +"5215" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5215.jpg" +"5216" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5216.jpg" +"5217" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5217.jpg" +"5218" "Is the sun soft in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5218.jpg" +"5219" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5219.jpg" +"5220" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5220.jpg" +"5221" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5221.jpg" +"5222" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5222.jpg" +"5223" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5223.jpg" +"5224" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5224.jpg" +"5225" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5225.jpg" +"5226" "Is the snow green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5226.jpg" +"5227" "Is the wall uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5227.jpg" +"5228" "Is the wall smooth in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5228.jpg" +"5229" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5229.jpg" +"5230" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5230.jpg" +"5231" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5231.jpg" +"5232" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5232.jpg" +"5233" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5233.jpg" +"5234" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5234.jpg" +"5235" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5235.jpg" +"5236" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5236.jpg" +"5237" "Are there two ducks in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5237.jpg" +"5238" "Are there three ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5238.jpg" +"5239" "Is there one pulp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5239.jpg" +"5240" "Are there two pulps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5240.jpg" +"5241" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5241.jpg" +"5242" "Does the person dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5242.jpg" +"5243" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5243.jpg" +"5244" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5244.jpg" +"5245" "Is the tree sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5245.jpg" +"5246" "Is the tree dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5246.jpg" +"5247" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5247.jpg" +"5248" "Is the grass on the brink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5248.jpg" +"5249" "Are there three giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5249.jpg" +"5250" "Are there four giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5250.jpg" +"5251" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5251.jpg" +"5252" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5252.jpg" +"5253" "Is the wall gray in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5253.jpg" +"5254" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5254.jpg" +"5255" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5255.jpg" +"5256" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5256.jpg" +"5257" "Is there one doll in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5257.jpg" +"5258" "Are there two dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5258.jpg" +"5259" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5259.jpg" +"5260" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5260.jpg" +"5261" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5261.jpg" +"5262" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5262.jpg" +"5263" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5263.jpg" +"5264" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5264.jpg" +"5265" "Is there one sunglasses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5265.jpg" +"5266" "Are there two sunglass in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5266.jpg" +"5267" "Is the glove black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5267.jpg" +"5268" "Is the glove white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5268.jpg" +"5269" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5269.jpg" +"5270" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5270.jpg" +"5271" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5271.jpg" +"5272" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5272.jpg" +"5273" "Is the plate yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5273.jpg" +"5274" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5274.jpg" +"5275" "Are there two bananas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5275.jpg" +"5276" "Are there three bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5276.jpg" +"5277" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5277.jpg" +"5278" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5278.jpg" +"5279" "Is the glass transparent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5279.jpg" +"5280" "Is the glass colored in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5280.jpg" +"5281" "Are there two eggs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5281.jpg" +"5282" "Are there three eggs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5282.jpg" +"5283" "Is there one scoon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5283.jpg" +"5284" "Are there two scoons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5284.jpg" +"5285" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5285.jpg" +"5286" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5286.jpg" +"5287" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5287.jpg" +"5288" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5288.jpg" +"5289" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5289.jpg" +"5290" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5290.jpg" +"5291" "Does the giraffe stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5291.jpg" +"5292" "Does the giraffe lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5292.jpg" +"5293" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5293.jpg" +"5294" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5294.jpg" +"5295" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5295.jpg" +"5296" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5296.jpg" +"5297" "Does the person jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5297.jpg" +"5298" "Does the person run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5298.jpg" +"5299" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5299.jpg" +"5300" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5300.jpg" +"5301" "Is there one tennis in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5301.jpg" +"5302" "Are there two tenni in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5302.jpg" +"5303" "Is the sky bright in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5303.jpg" +"5304" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5304.jpg" +"5305" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5305.jpg" +"5306" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5306.jpg" +"5307" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5307.jpg" +"5308" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5308.jpg" +"5309" "Are there two benches in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5309.jpg" +"5310" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5310.jpg" +"5311" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5311.jpg" +"5312" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5312.jpg" +"5313" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5313.jpg" +"5314" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5314.jpg" +"5315" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5315.jpg" +"5316" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5316.jpg" +"5317" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5317.jpg" +"5318" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5318.jpg" +"5319" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5319.jpg" +"5320" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5320.jpg" +"5321" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5321.jpg" +"5322" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5322.jpg" +"5323" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5323.jpg" +"5324" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5324.jpg" +"5325" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5325.jpg" +"5326" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5326.jpg" +"5327" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5327.jpg" +"5328" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5328.jpg" +"5329" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5329.jpg" +"5330" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5330.jpg" +"5331" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5331.jpg" +"5332" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5332.jpg" +"5333" "Is there one zebra in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5333.jpg" +"5334" "Are there two zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5334.jpg" +"5335" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5335.jpg" +"5336" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5336.jpg" +"5337" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5337.jpg" +"5338" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5338.jpg" +"5339" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5339.jpg" +"5340" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5340.jpg" +"5341" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5341.jpg" +"5342" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5342.jpg" +"5343" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5343.jpg" +"5344" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5344.jpg" +"5345" "Is the sign eye-catching in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5345.jpg" +"5346" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5346.jpg" +"5347" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5347.jpg" +"5348" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5348.jpg" +"5349" "Is the curtain good-looking in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5349.jpg" +"5350" "Is the curtain ugly in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5350.jpg" +"5351" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5351.jpg" +"5352" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5352.jpg" +"5353" "Are there three towels in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5353.jpg" +"5354" "Are there five towels in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5354.jpg" +"5355" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5355.jpg" +"5356" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5356.jpg" +"5357" "Is the cushion red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5357.jpg" +"5358" "Is the cushion black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5358.jpg" +"5359" "Is the tissue white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5359.jpg" +"5360" "Is the tissue pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5360.jpg" +"5361" "Is there one bear in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5361.jpg" +"5362" "Are there two bears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5362.jpg" +"5363" "Is the river turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5363.jpg" +"5364" "Is the river slow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5364.jpg" +"5365" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5365.jpg" +"5366" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5366.jpg" +"5367" "Does the horse stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5367.jpg" +"5368" "Does the horse lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5368.jpg" +"5369" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5369.jpg" +"5370" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5370.jpg" +"5371" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5371.jpg" +"5372" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5372.jpg" +"5373" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5373.jpg" +"5374" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5374.jpg" +"5375" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5375.jpg" +"5376" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5376.jpg" +"5377" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5377.jpg" +"5378" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5378.jpg" +"5379" "Is the tree lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5379.jpg" +"5380" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5380.jpg" +"5381" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5381.jpg" +"5382" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5382.jpg" +"5383" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5383.jpg" +"5384" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5384.jpg" +"5385" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5385.jpg" +"5386" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5386.jpg" +"5387" "Does the dog lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5387.jpg" +"5388" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5388.jpg" +"5389" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5389.jpg" +"5390" "Are there two tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5390.jpg" +"5391" "Is there one board in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5391.jpg" +"5392" "Are there two boards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5392.jpg" +"5393" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5393.jpg" +"5394" "Are there two knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5394.jpg" +"5395" "Is the carrot yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5395.jpg" +"5396" "Is the carrot white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5396.jpg" +"5397" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5397.jpg" +"5398" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5398.jpg" +"5399" "Is the rail straight in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5399.jpg" +"5400" "Is the rail curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5400.jpg" +"5401" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5401.jpg" +"5402" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5402.jpg" +"5403" "Is the river winding in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5403.jpg" +"5404" "Is the river straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5404.jpg" +"5405" "Is the sky overcast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5405.jpg" +"5406" "Is the sky bright in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5406.jpg" +"5407" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5407.jpg" +"5408" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5408.jpg" +"5409" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5409.jpg" +"5410" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5410.jpg" +"5411" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5411.jpg" +"5412" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5412.jpg" +"5413" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5413.jpg" +"5414" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5414.jpg" +"5415" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5415.jpg" +"5416" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5416.jpg" +"5417" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5417.jpg" +"5418" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5418.jpg" +"5419" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5419.jpg" +"5420" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5420.jpg" +"5421" "Are there two ships in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5421.jpg" +"5422" "Are there three ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5422.jpg" +"5423" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5423.jpg" +"5424" "Is the sea turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5424.jpg" +"5425" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5425.jpg" +"5426" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5426.jpg" +"5427" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5427.jpg" +"5428" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5428.jpg" +"5429" "Are there three apples in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5429.jpg" +"5430" "Are there four apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5430.jpg" +"5431" "Is the banana yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5431.jpg" +"5432" "Is the banana black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5432.jpg" +"5433" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5433.jpg" +"5434" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5434.jpg" +"5435" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5435.jpg" +"5436" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5436.jpg" +"5437" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5437.jpg" +"5438" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5438.jpg" +"5439" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5439.jpg" +"5440" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5440.jpg" +"5441" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5441.jpg" +"5442" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5442.jpg" +"5443" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5443.jpg" +"5444" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5444.jpg" +"5445" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5445.jpg" +"5446" "Is the cloud pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5446.jpg" +"5447" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5447.jpg" +"5448" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5448.jpg" +"5449" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5449.jpg" +"5450" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5450.jpg" +"5451" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5451.jpg" +"5452" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5452.jpg" +"5453" "Does the giraffe stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5453.jpg" +"5454" "Does the giraffe sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5454.jpg" +"5455" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5455.jpg" +"5456" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5456.jpg" +"5457" "Is the pizza damaged in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5457.jpg" +"5458" "Is the pizza complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5458.jpg" +"5459" "Are there three birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5459.jpg" +"5460" "Are there four birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5460.jpg" +"5461" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5461.jpg" +"5462" "Is the plate blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5462.jpg" +"5463" "Is the phone open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5463.jpg" +"5464" "Is the phone closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5464.jpg" +"5465" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5465.jpg" +"5466" "Are there two knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5466.jpg" +"5467" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5467.jpg" +"5468" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5468.jpg" +"5469" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5469.jpg" +"5470" "Is the forest red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5470.jpg" +"5471" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5471.jpg" +"5472" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5472.jpg" +"5473" "Does the lion walk in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5473.jpg" +"5474" "Does the lion jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5474.jpg" +"5475" "Are there two giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5475.jpg" +"5476" "Are there three giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5476.jpg" +"5477" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5477.jpg" +"5478" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5478.jpg" +"5479" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5479.jpg" +"5480" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5480.jpg" +"5481" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5481.jpg" +"5482" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5482.jpg" +"5483" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5483.jpg" +"5484" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5484.jpg" +"5485" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5485.jpg" +"5486" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5486.jpg" +"5487" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5487.jpg" +"5488" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5488.jpg" +"5489" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5489.jpg" +"5490" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5490.jpg" +"5491" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5491.jpg" +"5492" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5492.jpg" +"5493" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5493.jpg" +"5494" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5494.jpg" +"5495" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5495.jpg" +"5496" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5496.jpg" +"5497" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5497.jpg" +"5498" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5498.jpg" +"5499" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5499.jpg" +"5500" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5500.jpg" +"5501" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5501.jpg" +"5502" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5502.jpg" +"5503" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5503.jpg" +"5504" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5504.jpg" +"5505" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5505.jpg" +"5506" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5506.jpg" +"5507" "Is the bread round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5507.jpg" +"5508" "Is the bread square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5508.jpg" +"5509" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5509.jpg" +"5510" "Are there two knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5510.jpg" +"5511" "Is there one fork in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5511.jpg" +"5512" "Are there two forks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5512.jpg" +"5513" "Is the tissue white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5513.jpg" +"5514" "Is the tissue red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5514.jpg" +"5515" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5515.jpg" +"5516" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5516.jpg" +"5517" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5517.jpg" +"5518" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5518.jpg" +"5519" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5519.jpg" +"5520" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5520.jpg" +"5521" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5521.jpg" +"5522" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5522.jpg" +"5523" "Is there one lounge in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5523.jpg" +"5524" "Are there two lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5524.jpg" +"5525" "Is the plate black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5525.jpg" +"5526" "Is the plate white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5526.jpg" +"5527" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5527.jpg" +"5528" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5528.jpg" +"5529" "Are there two bananas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5529.jpg" +"5530" "Are there three bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5530.jpg" +"5531" "Is there one pear in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5531.jpg" +"5532" "Are there two pears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5532.jpg" +"5533" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5533.jpg" +"5534" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5534.jpg" +"5535" "Is there one bread in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5535.jpg" +"5536" "Are there two breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5536.jpg" +"5537" "Is there one fork in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5537.jpg" +"5538" "Are there two forks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5538.jpg" +"5539" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5539.jpg" +"5540" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5540.jpg" +"5541" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5541.jpg" +"5542" "Is the cloud red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5542.jpg" +"5543" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5543.jpg" +"5544" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5544.jpg" +"5545" "Is the ground sensory in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5545.jpg" +"5546" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5546.jpg" +"5547" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5547.jpg" +"5548" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5548.jpg" +"5549" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5549.jpg" +"5550" "Is the tree black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5550.jpg" +"5551" "Is the flag fluttering in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5551.jpg" +"5552" "Is the flag motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5552.jpg" +"5553" "Is there one giraffe in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5553.jpg" +"5554" "Are there two giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5554.jpg" +"5555" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5555.jpg" +"5556" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5556.jpg" +"5557" "Is the sea calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5557.jpg" +"5558" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5558.jpg" +"5559" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5559.jpg" +"5560" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5560.jpg" +"5561" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5561.jpg" +"5562" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5562.jpg" +"5563" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5563.jpg" +"5564" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5564.jpg" +"5565" "Does the person run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5565.jpg" +"5566" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5566.jpg" +"5567" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5567.jpg" +"5568" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5568.jpg" +"5569" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5569.jpg" +"5570" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5570.jpg" +"5571" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5571.jpg" +"5572" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5572.jpg" +"5573" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5573.jpg" +"5574" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5574.jpg" +"5575" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5575.jpg" +"5576" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5576.jpg" +"5577" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5577.jpg" +"5578" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5578.jpg" +"5579" "Is the sky bright in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5579.jpg" +"5580" "Is the sky dark in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5580.jpg" +"5581" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5581.jpg" +"5582" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5582.jpg" +"5583" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5583.jpg" +"5584" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5584.jpg" +"5585" "Is the rail curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5585.jpg" +"5586" "Is the rail straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5586.jpg" +"5587" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5587.jpg" +"5588" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5588.jpg" +"5589" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5589.jpg" +"5590" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5590.jpg" +"5591" "Is the computer open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5591.jpg" +"5592" "Is the computer closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5592.jpg" +"5593" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5593.jpg" +"5594" "Is the keyboard blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5594.jpg" +"5595" "Is there one laptop in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5595.jpg" +"5596" "Are there two laptops in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5596.jpg" +"5597" "Are there two cards in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5597.jpg" +"5598" "Are there three cards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5598.jpg" +"5599" "Is the cable white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5599.jpg" +"5600" "Is the cable black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5600.jpg" +"5601" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5601.jpg" +"5602" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5602.jpg" +"5603" "Is there one support in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5603.jpg" +"5604" "Are there two supports in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5604.jpg" +"5605" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5605.jpg" +"5606" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5606.jpg" +"5607" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5607.jpg" +"5608" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5608.jpg" +"5609" "Is the tree tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5609.jpg" +"5610" "Is the tree short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5610.jpg" +"5611" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5611.jpg" +"5612" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5612.jpg" +"5613" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5613.jpg" +"5614" "Are there six people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5614.jpg" +"5615" "Does the elephant stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5615.jpg" +"5616" "Does the elephant lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5616.jpg" +"5617" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5617.jpg" +"5618" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5618.jpg" +"5619" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5619.jpg" +"5620" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5620.jpg" +"5621" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5621.jpg" +"5622" "Are there three knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5622.jpg" +"5623" "Is the orange complete in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5623.jpg" +"5624" "Is the orange damaged in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5624.jpg" +"5625" "Is the forest lush in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5625.jpg" +"5626" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5626.jpg" +"5627" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5627.jpg" +"5628" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5628.jpg" +"5629" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5629.jpg" +"5630" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5630.jpg" +"5631" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5631.jpg" +"5632" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5632.jpg" +"5633" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5633.jpg" +"5634" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5634.jpg" +"5635" "Is the hat blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5635.jpg" +"5636" "Is the hat white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5636.jpg" +"5637" "Is there one baseball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5637.jpg" +"5638" "Are there two baseballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5638.jpg" +"5639" "Is there one baseball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5639.jpg" +"5640" "Are there two baseballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5640.jpg" +"5641" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5641.jpg" +"5642" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5642.jpg" +"5643" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5643.jpg" +"5644" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5644.jpg" +"5645" "Is the glove yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5645.jpg" +"5646" "Is the glove blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5646.jpg" +"5647" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5647.jpg" +"5648" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5648.jpg" +"5649" "Is there one blanket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5649.jpg" +"5650" "Are there two blankets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5650.jpg" +"5651" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5651.jpg" +"5652" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5652.jpg" +"5653" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5653.jpg" +"5654" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5654.jpg" +"5655" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5655.jpg" +"5656" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5656.jpg" +"5657" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5657.jpg" +"5658" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5658.jpg" +"5659" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5659.jpg" +"5660" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5660.jpg" +"5661" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5661.jpg" +"5662" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5662.jpg" +"5663" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5663.jpg" +"5664" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5664.jpg" +"5665" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5665.jpg" +"5666" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5666.jpg" +"5667" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5667.jpg" +"5668" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5668.jpg" +"5669" "Is the bridge simple in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5669.jpg" +"5670" "Is the bridge exquisite in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5670.jpg" +"5671" "Is the lake murky in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5671.jpg" +"5672" "Is the lake clear in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5672.jpg" +"5673" "Is the forest colorful in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5673.jpg" +"5674" "Is the forest dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5674.jpg" +"5675" "Is the monitor open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5675.jpg" +"5676" "Is the monitor closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5676.jpg" +"5677" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5677.jpg" +"5678" "Are there two mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5678.jpg" +"5679" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5679.jpg" +"5680" "Are there two keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5680.jpg" +"5681" "Is the cable messy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5681.jpg" +"5682" "Is the cable neat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5682.jpg" +"5683" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5683.jpg" +"5684" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5684.jpg" +"5685" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5685.jpg" +"5686" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5686.jpg" +"5687" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5687.jpg" +"5688" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5688.jpg" +"5689" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5689.jpg" +"5690" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5690.jpg" +"5691" "Does the person skiing in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5691.jpg" +"5692" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5692.jpg" +"5693" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5693.jpg" +"5694" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5694.jpg" +"5695" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5695.jpg" +"5696" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5696.jpg" +"5697" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5697.jpg" +"5698" "Is the sky blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5698.jpg" +"5699" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5699.jpg" +"5700" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5700.jpg" +"5701" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5701.jpg" +"5702" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5702.jpg" +"5703" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5703.jpg" +"5704" "Is the bath black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5704.jpg" +"5705" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5705.jpg" +"5706" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5706.jpg" +"5707" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5707.jpg" +"5708" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5708.jpg" +"5709" "Is there one showerhead in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5709.jpg" +"5710" "Are there two showerheads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5710.jpg" +"5711" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5711.jpg" +"5712" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5712.jpg" +"5713" "Is the sea stormy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5713.jpg" +"5714" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5714.jpg" +"5715" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5715.jpg" +"5716" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5716.jpg" +"5717" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5717.jpg" +"5718" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5718.jpg" +"5719" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5719.jpg" +"5720" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5720.jpg" +"5721" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5721.jpg" +"5722" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5722.jpg" +"5723" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5723.jpg" +"5724" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5724.jpg" +"5725" "Are there two horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5725.jpg" +"5726" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5726.jpg" +"5727" "Does the person horseback riding in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5727.jpg" +"5728" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5728.jpg" +"5729" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5729.jpg" +"5730" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5730.jpg" +"5731" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5731.jpg" +"5732" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5732.jpg" +"5733" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5733.jpg" +"5734" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5734.jpg" +"5735" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5735.jpg" +"5736" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5736.jpg" +"5737" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5737.jpg" +"5738" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5738.jpg" +"5739" "Are there two bears in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5739.jpg" +"5740" "Are there three bears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5740.jpg" +"5741" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5741.jpg" +"5742" "Is the tree red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5742.jpg" +"5743" "Is the guardrail short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5743.jpg" +"5744" "Is the guardrail tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5744.jpg" +"5745" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5745.jpg" +"5746" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5746.jpg" +"5747" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5747.jpg" +"5748" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5748.jpg" +"5749" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5749.jpg" +"5750" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5750.jpg" +"5751" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5751.jpg" +"5752" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5752.jpg" +"5753" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5753.jpg" +"5754" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5754.jpg" +"5755" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5755.jpg" +"5756" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5756.jpg" +"5757" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5757.jpg" +"5758" "Is the tree black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5758.jpg" +"5759" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5759.jpg" +"5760" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5760.jpg" +"5761" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5761.jpg" +"5762" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5762.jpg" +"5763" "Is the hat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5763.jpg" +"5764" "Is the hat blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5764.jpg" +"5765" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5765.jpg" +"5766" "Does the person dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5766.jpg" +"5767" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5767.jpg" +"5768" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5768.jpg" +"5769" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5769.jpg" +"5770" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5770.jpg" +"5771" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5771.jpg" +"5772" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5772.jpg" +"5773" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5773.jpg" +"5774" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5774.jpg" +"5775" "Is the sky bright in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5775.jpg" +"5776" "Is the sky dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5776.jpg" +"5777" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5777.jpg" +"5778" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5778.jpg" +"5779" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5779.jpg" +"5780" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5780.jpg" +"5781" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5781.jpg" +"5782" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5782.jpg" +"5783" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5783.jpg" +"5784" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5784.jpg" +"5785" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5785.jpg" +"5786" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5786.jpg" +"5787" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5787.jpg" +"5788" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5788.jpg" +"5789" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5789.jpg" +"5790" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5790.jpg" +"5791" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5791.jpg" +"5792" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5792.jpg" +"5793" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5793.jpg" +"5794" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5794.jpg" +"5795" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5795.jpg" +"5796" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5796.jpg" +"5797" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5797.jpg" +"5798" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5798.jpg" +"5799" "Is the banana yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5799.jpg" +"5800" "Is the banana green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5800.jpg" +"5801" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5801.jpg" +"5802" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5802.jpg" +"5803" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5803.jpg" +"5804" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5804.jpg" +"5805" "Is the mountain green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5805.jpg" +"5806" "Is the mountain yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5806.jpg" +"5807" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5807.jpg" +"5808" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5808.jpg" +"5809" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5809.jpg" +"5810" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5810.jpg" +"5811" "Is the lake calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5811.jpg" +"5812" "Is the lake stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5812.jpg" +"5813" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5813.jpg" +"5814" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5814.jpg" +"5815" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5815.jpg" +"5816" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5816.jpg" +"5817" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5817.jpg" +"5818" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5818.jpg" +"5819" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5819.jpg" +"5820" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5820.jpg" +"5821" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5821.jpg" +"5822" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5822.jpg" +"5823" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5823.jpg" +"5824" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5824.jpg" +"5825" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5825.jpg" +"5826" "Is the tree white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5826.jpg" +"5827" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5827.jpg" +"5828" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5828.jpg" +"5829" "Are there four motorbikes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5829.jpg" +"5830" "Are there six motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5830.jpg" +"5831" "Is the streetlamp open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5831.jpg" +"5832" "Is the streetlamp closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5832.jpg" +"5833" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5833.jpg" +"5834" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5834.jpg" +"5835" "Is there one pulp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5835.jpg" +"5836" "Are there two pulps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5836.jpg" +"5837" "Is the sea surging waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5837.jpg" +"5838" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5838.jpg" +"5839" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5839.jpg" +"5840" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5840.jpg" +"5841" "Is there one doll in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5841.jpg" +"5842" "Are there two dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5842.jpg" +"5843" "Is the chair white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5843.jpg" +"5844" "Is the chair black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5844.jpg" +"5845" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5845.jpg" +"5846" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5846.jpg" +"5847" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5847.jpg" +"5848" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5848.jpg" +"5849" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5849.jpg" +"5850" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5850.jpg" +"5851" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5851.jpg" +"5852" "Are there two mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5852.jpg" +"5853" "Is the apple green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5853.jpg" +"5854" "Is the apple red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5854.jpg" +"5855" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5855.jpg" +"5856" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5856.jpg" +"5857" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5857.jpg" +"5858" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5858.jpg" +"5859" "Are there two toothbrushes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5859.jpg" +"5860" "Are there three toothbrushes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5860.jpg" +"5861" "Is there one toothpaste in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5861.jpg" +"5862" "Are there two toothpastes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5862.jpg" +"5863" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5863.jpg" +"5864" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5864.jpg" +"5865" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5865.jpg" +"5866" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5866.jpg" +"5867" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5867.jpg" +"5868" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5868.jpg" +"5869" "Are there three pillows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5869.jpg" +"5870" "Are there four pillows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5870.jpg" +"5871" "Is there one doll in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5871.jpg" +"5872" "Are there two dolls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5872.jpg" +"5873" "Is the controller black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5873.jpg" +"5874" "Is the controller blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5874.jpg" +"5875" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5875.jpg" +"5876" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5876.jpg" +"5877" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5877.jpg" +"5878" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5878.jpg" +"5879" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5879.jpg" +"5880" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5880.jpg" +"5881" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5881.jpg" +"5882" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5882.jpg" +"5883" "Is the hat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5883.jpg" +"5884" "Is the hat white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5884.jpg" +"5885" "Is the glove black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5885.jpg" +"5886" "Is the glove red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5886.jpg" +"5887" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5887.jpg" +"5888" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5888.jpg" +"5889" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5889.jpg" +"5890" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5890.jpg" +"5891" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5891.jpg" +"5892" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5892.jpg" +"5893" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5893.jpg" +"5894" "Are there two mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5894.jpg" +"5895" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5895.jpg" +"5896" "Is the keyboard blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5896.jpg" +"5897" "Is the monitor open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5897.jpg" +"5898" "Is the monitor closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5898.jpg" +"5899" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5899.jpg" +"5900" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5900.jpg" +"5901" "Is there one notebook in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5901.jpg" +"5902" "Are there two notebooks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5902.jpg" +"5903" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5903.jpg" +"5904" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5904.jpg" +"5905" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5905.jpg" +"5906" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5906.jpg" +"5907" "Are there six tangerines in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5907.jpg" +"5908" "Are there seven tangerines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5908.jpg" +"5909" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5909.jpg" +"5910" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5910.jpg" +"5911" "Is the lemon yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5911.jpg" +"5912" "Is the lemon blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5912.jpg" +"5913" "Are there two ducks in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5913.jpg" +"5914" "Are there three ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5914.jpg" +"5915" "Is the river murky in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5915.jpg" +"5916" "Is the river clear in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5916.jpg" +"5917" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5917.jpg" +"5918" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5918.jpg" +"5919" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5919.jpg" +"5920" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5920.jpg" +"5921" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5921.jpg" +"5922" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5922.jpg" +"5923" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5923.jpg" +"5924" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5924.jpg" +"5925" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5925.jpg" +"5926" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5926.jpg" +"5927" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5927.jpg" +"5928" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5928.jpg" +"5929" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5929.jpg" +"5930" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5930.jpg" +"5931" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5931.jpg" +"5932" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5932.jpg" +"5933" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5933.jpg" +"5934" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5934.jpg" +"5935" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5935.jpg" +"5936" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5936.jpg" +"5937" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5937.jpg" +"5938" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5938.jpg" +"5939" "Is there one rack in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5939.jpg" +"5940" "Are there two racks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5940.jpg" +"5941" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5941.jpg" +"5942" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5942.jpg" +"5943" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5943.jpg" +"5944" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5944.jpg" +"5945" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5945.jpg" +"5946" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5946.jpg" +"5947" "Does the cat lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5947.jpg" +"5948" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5948.jpg" +"5949" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5949.jpg" +"5950" "Is the grass red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5950.jpg" +"5951" "Are there two breads in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5951.jpg" +"5952" "Are there three breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5952.jpg" +"5953" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5953.jpg" +"5954" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5954.jpg" +"5955" "Does the person jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5955.jpg" +"5956" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5956.jpg" +"5957" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5957.jpg" +"5958" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5958.jpg" +"5959" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5959.jpg" +"5960" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5960.jpg" +"5961" "Are there three bananas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5961.jpg" +"5962" "Are there four bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5962.jpg" +"5963" "Is the tangerine yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5963.jpg" +"5964" "Is the tangerine green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5964.jpg" +"5965" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5965.jpg" +"5966" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5966.jpg" +"5967" "Is the paper white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5967.jpg" +"5968" "Is the paper blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5968.jpg" +"5969" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5969.jpg" +"5970" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5970.jpg" +"5971" "Are there two pens in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5971.jpg" +"5972" "Are there six pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5972.jpg" +"5973" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5973.jpg" +"5974" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5974.jpg" +"5975" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5975.jpg" +"5976" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5976.jpg" +"5977" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5977.jpg" +"5978" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5978.jpg" +"5979" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5979.jpg" +"5980" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5980.jpg" +"5981" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5981.jpg" +"5982" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5982.jpg" +"5983" "Is the backpack black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5983.jpg" +"5984" "Is the backpack white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5984.jpg" +"5985" "Is there one mouse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5985.jpg" +"5986" "Are there two mice in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5986.jpg" +"5987" "Is the keyboard white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5987.jpg" +"5988" "Is the keyboard black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5988.jpg" +"5989" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5989.jpg" +"5990" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5990.jpg" +"5991" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5991.jpg" +"5992" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5992.jpg" +"5993" "Is there one elephant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5993.jpg" +"5994" "Are there two elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5994.jpg" +"5995" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5995.jpg" +"5996" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5996.jpg" +"5997" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5997.jpg" +"5998" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5998.jpg" +"5999" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/5999.jpg" +"6000" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6000.jpg" +"6001" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6001.jpg" +"6002" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6002.jpg" +"6003" "Are there two birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6003.jpg" +"6004" "Are there three birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6004.jpg" +"6005" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6005.jpg" +"6006" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6006.jpg" +"6007" "Are there three zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6007.jpg" +"6008" "Are there four zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6008.jpg" +"6009" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6009.jpg" +"6010" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6010.jpg" +"6011" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6011.jpg" +"6012" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6012.jpg" +"6013" "Does the cat lie down in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6013.jpg" +"6014" "Does the cat stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6014.jpg" +"6015" "Is there one controller in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6015.jpg" +"6016" "Are there two controllers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6016.jpg" +"6017" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6017.jpg" +"6018" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6018.jpg" +"6019" "Is the floor dirty in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6019.jpg" +"6020" "Is the floor clean in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6020.jpg" +"6021" "Is there one microwave in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6021.jpg" +"6022" "Are there two microwaves in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6022.jpg" +"6023" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6023.jpg" +"6024" "Are there two tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6024.jpg" +"6025" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6025.jpg" +"6026" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6026.jpg" +"6027" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6027.jpg" +"6028" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6028.jpg" +"6029" "Are there two giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6029.jpg" +"6030" "Are there three giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6030.jpg" +"6031" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6031.jpg" +"6032" "Is the tree white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6032.jpg" +"6033" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6033.jpg" +"6034" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6034.jpg" +"6035" "Is the blanket blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6035.jpg" +"6036" "Is the blanket black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6036.jpg" +"6037" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6037.jpg" +"6038" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6038.jpg" +"6039" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6039.jpg" +"6040" "Is the sea calm and waveless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6040.jpg" +"6041" "Is there one pulp in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6041.jpg" +"6042" "Are there two pulps in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6042.jpg" +"6043" "Does the person row a boat in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6043.jpg" +"6044" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6044.jpg" +"6045" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6045.jpg" +"6046" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6046.jpg" +"6047" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6047.jpg" +"6048" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6048.jpg" +"6049" "Is the ground curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6049.jpg" +"6050" "Is the ground straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6050.jpg" +"6051" "Is there one bus in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6051.jpg" +"6052" "Are there two buses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6052.jpg" +"6053" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6053.jpg" +"6054" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6054.jpg" +"6055" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6055.jpg" +"6056" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6056.jpg" +"6057" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6057.jpg" +"6058" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6058.jpg" +"6059" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6059.jpg" +"6060" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6060.jpg" +"6061" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6061.jpg" +"6062" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6062.jpg" +"6063" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6063.jpg" +"6064" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6064.jpg" +"6065" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6065.jpg" +"6066" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6066.jpg" +"6067" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6067.jpg" +"6068" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6068.jpg" +"6069" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6069.jpg" +"6070" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6070.jpg" +"6071" "Is the signal prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6071.jpg" +"6072" "Is the signal hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6072.jpg" +"6073" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6073.jpg" +"6074" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6074.jpg" +"6075" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6075.jpg" +"6076" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6076.jpg" +"6077" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6077.jpg" +"6078" "Does the person dance in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6078.jpg" +"6079" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6079.jpg" +"6080" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6080.jpg" +"6081" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6081.jpg" +"6082" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6082.jpg" +"6083" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6083.jpg" +"6084" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6084.jpg" +"6085" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6085.jpg" +"6086" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6086.jpg" +"6087" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6087.jpg" +"6088" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6088.jpg" +"6089" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6089.jpg" +"6090" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6090.jpg" +"6091" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6091.jpg" +"6092" "Does the person jump in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6092.jpg" +"6093" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6093.jpg" +"6094" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6094.jpg" +"6095" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6095.jpg" +"6096" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6096.jpg" +"6097" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6097.jpg" +"6098" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6098.jpg" +"6099" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6099.jpg" +"6100" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6100.jpg" +"6101" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6101.jpg" +"6102" "Is the tree blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6102.jpg" +"6103" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6103.jpg" +"6104" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6104.jpg" +"6105" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6105.jpg" +"6106" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6106.jpg" +"6107" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6107.jpg" +"6108" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6108.jpg" +"6109" "Is there one sign in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6109.jpg" +"6110" "Are there two signs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6110.jpg" +"6111" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6111.jpg" +"6112" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6112.jpg" +"6113" "Is the orange damaged in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6113.jpg" +"6114" "Is the orange complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6114.jpg" +"6115" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6115.jpg" +"6116" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6116.jpg" +"6117" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6117.jpg" +"6118" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6118.jpg" +"6119" "Are there five giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6119.jpg" +"6120" "Are there seven giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6120.jpg" +"6121" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6121.jpg" +"6122" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6122.jpg" +"6123" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6123.jpg" +"6124" "Is the forest red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6124.jpg" +"6125" "Is the river murky in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6125.jpg" +"6126" "Is the river clear in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6126.jpg" +"6127" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6127.jpg" +"6128" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6128.jpg" +"6129" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6129.jpg" +"6130" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6130.jpg" +"6131" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6131.jpg" +"6132" "Is the forest red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6132.jpg" +"6133" "Is the streetlamp open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6133.jpg" +"6134" "Is the streetlamp closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6134.jpg" +"6135" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6135.jpg" +"6136" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6136.jpg" +"6137" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6137.jpg" +"6138" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6138.jpg" +"6139" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6139.jpg" +"6140" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6140.jpg" +"6141" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6141.jpg" +"6142" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6142.jpg" +"6143" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6143.jpg" +"6144" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6144.jpg" +"6145" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6145.jpg" +"6146" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6146.jpg" +"6147" "Are there five people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6147.jpg" +"6148" "Are there six people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6148.jpg" +"6149" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6149.jpg" +"6150" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6150.jpg" +"6151" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6151.jpg" +"6152" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6152.jpg" +"6153" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6153.jpg" +"6154" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6154.jpg" +"6155" "Does the dog sleep in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6155.jpg" +"6156" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6156.jpg" +"6157" "Are there four controllers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6157.jpg" +"6158" "Are there five controllers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6158.jpg" +"6159" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6159.jpg" +"6160" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6160.jpg" +"6161" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6161.jpg" +"6162" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6162.jpg" +"6163" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6163.jpg" +"6164" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6164.jpg" +"6165" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6165.jpg" +"6166" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6166.jpg" +"6167" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6167.jpg" +"6168" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6168.jpg" +"6169" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6169.jpg" +"6170" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6170.jpg" +"6171" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6171.jpg" +"6172" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6172.jpg" +"6173" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6173.jpg" +"6174" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6174.jpg" +"6175" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6175.jpg" +"6176" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6176.jpg" +"6177" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6177.jpg" +"6178" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6178.jpg" +"6179" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6179.jpg" +"6180" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6180.jpg" +"6181" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6181.jpg" +"6182" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6182.jpg" +"6183" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6183.jpg" +"6184" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6184.jpg" +"6185" "Does the sky sunny in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6185.jpg" +"6186" "Does the sky gloomy in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6186.jpg" +"6187" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6187.jpg" +"6188" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6188.jpg" +"6189" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6189.jpg" +"6190" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6190.jpg" +"6191" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6191.jpg" +"6192" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6192.jpg" +"6193" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6193.jpg" +"6194" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6194.jpg" +"6195" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6195.jpg" +"6196" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6196.jpg" +"6197" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6197.jpg" +"6198" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6198.jpg" +"6199" "Is the sheep white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6199.jpg" +"6200" "Is the sheep black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6200.jpg" +"6201" "Is the fence short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6201.jpg" +"6202" "Is the fence tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6202.jpg" +"6203" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6203.jpg" +"6204" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6204.jpg" +"6205" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6205.jpg" +"6206" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6206.jpg" +"6207" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6207.jpg" +"6208" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6208.jpg" +"6209" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6209.jpg" +"6210" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6210.jpg" +"6211" "Are there two benches in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6211.jpg" +"6212" "Are there three benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6212.jpg" +"6213" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6213.jpg" +"6214" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6214.jpg" +"6215" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6215.jpg" +"6216" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6216.jpg" +"6217" "Is the broccoli green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6217.jpg" +"6218" "Is the broccoli blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6218.jpg" +"6219" "Is the cowpea green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6219.jpg" +"6220" "Is the cowpea black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6220.jpg" +"6221" "Is the shrimp ripe in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6221.jpg" +"6222" "Is the shrimp raw in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6222.jpg" +"6223" "Are there three oranges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6223.jpg" +"6224" "Are there four oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6224.jpg" +"6225" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6225.jpg" +"6226" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6226.jpg" +"6227" "Is the tree withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6227.jpg" +"6228" "Is the tree lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6228.jpg" +"6229" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6229.jpg" +"6230" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6230.jpg" +"6231" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6231.jpg" +"6232" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6232.jpg" +"6233" "Are there four people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6233.jpg" +"6234" "Are there five people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6234.jpg" +"6235" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6235.jpg" +"6236" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6236.jpg" +"6237" "Is the flag fluttering in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6237.jpg" +"6238" "Is the flag motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6238.jpg" +"6239" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6239.jpg" +"6240" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6240.jpg" +"6241" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6241.jpg" +"6242" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6242.jpg" +"6243" "Are there two oranges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6243.jpg" +"6244" "Are there three oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6244.jpg" +"6245" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6245.jpg" +"6246" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6246.jpg" +"6247" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6247.jpg" +"6248" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6248.jpg" +"6249" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6249.jpg" +"6250" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6250.jpg" +"6251" "Is there one tennis in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6251.jpg" +"6252" "Are there two tenni in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6252.jpg" +"6253" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6253.jpg" +"6254" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6254.jpg" +"6255" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6255.jpg" +"6256" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6256.jpg" +"6257" "Are there three frisbees in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6257.jpg" +"6258" "Are there four frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6258.jpg" +"6259" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6259.jpg" +"6260" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6260.jpg" +"6261" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6261.jpg" +"6262" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6262.jpg" +"6263" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6263.jpg" +"6264" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6264.jpg" +"6265" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6265.jpg" +"6266" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6266.jpg" +"6267" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6267.jpg" +"6268" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6268.jpg" +"6269" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6269.jpg" +"6270" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6270.jpg" +"6271" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6271.jpg" +"6272" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6272.jpg" +"6273" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6273.jpg" +"6274" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6274.jpg" +"6275" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6275.jpg" +"6276" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6276.jpg" +"6277" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6277.jpg" +"6278" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6278.jpg" +"6279" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6279.jpg" +"6280" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6280.jpg" +"6281" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6281.jpg" +"6282" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6282.jpg" +"6283" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6283.jpg" +"6284" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6284.jpg" +"6285" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6285.jpg" +"6286" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6286.jpg" +"6287" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6287.jpg" +"6288" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6288.jpg" +"6289" "Is the sky dim in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6289.jpg" +"6290" "Is the sky bright in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6290.jpg" +"6291" "Is the sea calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6291.jpg" +"6292" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6292.jpg" +"6293" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6293.jpg" +"6294" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6294.jpg" +"6295" "Are there three people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6295.jpg" +"6296" "Are there four people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6296.jpg" +"6297" "Are there two horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6297.jpg" +"6298" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6298.jpg" +"6299" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6299.jpg" +"6300" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6300.jpg" +"6301" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6301.jpg" +"6302" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6302.jpg" +"6303" "Is the pot green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6303.jpg" +"6304" "Is the pot white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6304.jpg" +"6305" "Is the book neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6305.jpg" +"6306" "Is the book messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6306.jpg" +"6307" "Is the computer open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6307.jpg" +"6308" "Is the computer closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6308.jpg" +"6309" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6309.jpg" +"6310" "Are there two keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6310.jpg" +"6311" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6311.jpg" +"6312" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6312.jpg" +"6313" "Is there one ring in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6313.jpg" +"6314" "Are there three rings in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6314.jpg" +"6315" "Is the cable messy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6315.jpg" +"6316" "Is the cable neat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6316.jpg" +"6317" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6317.jpg" +"6318" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6318.jpg" +"6319" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6319.jpg" +"6320" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6320.jpg" +"6321" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6321.jpg" +"6322" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6322.jpg" +"6323" "Is the road narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6323.jpg" +"6324" "Is the road wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6324.jpg" +"6325" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6325.jpg" +"6326" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6326.jpg" +"6327" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6327.jpg" +"6328" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6328.jpg" +"6329" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6329.jpg" +"6330" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6330.jpg" +"6331" "Are there two giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6331.jpg" +"6332" "Are there three giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6332.jpg" +"6333" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6333.jpg" +"6334" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6334.jpg" +"6335" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6335.jpg" +"6336" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6336.jpg" +"6337" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6337.jpg" +"6338" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6338.jpg" +"6339" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6339.jpg" +"6340" "Is the bath black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6340.jpg" +"6341" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6341.jpg" +"6342" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6342.jpg" +"6343" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6343.jpg" +"6344" "Is the tree black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6344.jpg" +"6345" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6345.jpg" +"6346" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6346.jpg" +"6347" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6347.jpg" +"6348" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6348.jpg" +"6349" "Are there three giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6349.jpg" +"6350" "Are there four giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6350.jpg" +"6351" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6351.jpg" +"6352" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6352.jpg" +"6353" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6353.jpg" +"6354" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6354.jpg" +"6355" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6355.jpg" +"6356" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6356.jpg" +"6357" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6357.jpg" +"6358" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6358.jpg" +"6359" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6359.jpg" +"6360" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6360.jpg" +"6361" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6361.jpg" +"6362" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6362.jpg" +"6363" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6363.jpg" +"6364" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6364.jpg" +"6365" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6365.jpg" +"6366" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6366.jpg" +"6367" "Is the tap open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6367.jpg" +"6368" "Is the tap closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6368.jpg" +"6369" "Is there one socket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6369.jpg" +"6370" "Are there two sockets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6370.jpg" +"6371" "Is the ground wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6371.jpg" +"6372" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6372.jpg" +"6373" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6373.jpg" +"6374" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6374.jpg" +"6375" "Is there one tennis in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6375.jpg" +"6376" "Are there two tenni in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6376.jpg" +"6377" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6377.jpg" +"6378" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6378.jpg" +"6379" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6379.jpg" +"6380" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6380.jpg" +"6381" "Is there one lemon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6381.jpg" +"6382" "Are there two lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6382.jpg" +"6383" "Is there one lemon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6383.jpg" +"6384" "Are there two lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6384.jpg" +"6385" "Is there one orange in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6385.jpg" +"6386" "Are there two oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6386.jpg" +"6387" "Is there one grapefruit in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6387.jpg" +"6388" "Are there two grapefruits in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6388.jpg" +"6389" "Is the hat white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6389.jpg" +"6390" "Is the hat blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6390.jpg" +"6391" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6391.jpg" +"6392" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6392.jpg" +"6393" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6393.jpg" +"6394" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6394.jpg" +"6395" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6395.jpg" +"6396" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6396.jpg" +"6397" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6397.jpg" +"6398" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6398.jpg" +"6399" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6399.jpg" +"6400" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6400.jpg" +"6401" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6401.jpg" +"6402" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6402.jpg" +"6403" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6403.jpg" +"6404" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6404.jpg" +"6405" "Is there one tangerine in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6405.jpg" +"6406" "Are there two tangerines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6406.jpg" +"6407" "Is the banana yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6407.jpg" +"6408" "Is the banana blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6408.jpg" +"6409" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6409.jpg" +"6410" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6410.jpg" +"6411" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6411.jpg" +"6412" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6412.jpg" +"6413" "Are there four horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6413.jpg" +"6414" "Are there five horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6414.jpg" +"6415" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6415.jpg" +"6416" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6416.jpg" +"6417" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6417.jpg" +"6418" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6418.jpg" +"6419" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6419.jpg" +"6420" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6420.jpg" +"6421" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6421.jpg" +"6422" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6422.jpg" +"6423" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6423.jpg" +"6424" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6424.jpg" +"6425" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6425.jpg" +"6426" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6426.jpg" +"6427" "Does the giraffe lower in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6427.jpg" +"6428" "Does the giraffe raise in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6428.jpg" +"6429" "Are there two zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6429.jpg" +"6430" "Are there three zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6430.jpg" +"6431" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6431.jpg" +"6432" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6432.jpg" +"6433" "Is the cat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6433.jpg" +"6434" "Is the cat white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6434.jpg" +"6435" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6435.jpg" +"6436" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6436.jpg" +"6437" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6437.jpg" +"6438" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6438.jpg" +"6439" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6439.jpg" +"6440" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6440.jpg" +"6441" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6441.jpg" +"6442" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6442.jpg" +"6443" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6443.jpg" +"6444" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6444.jpg" +"6445" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6445.jpg" +"6446" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6446.jpg" +"6447" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6447.jpg" +"6448" "Is the sea calm seas in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6448.jpg" +"6449" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6449.jpg" +"6450" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6450.jpg" +"6451" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6451.jpg" +"6452" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6452.jpg" +"6453" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6453.jpg" +"6454" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6454.jpg" +"6455" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6455.jpg" +"6456" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6456.jpg" +"6457" "Is there one keyboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6457.jpg" +"6458" "Are there two keyboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6458.jpg" +"6459" "Is the cup red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6459.jpg" +"6460" "Is the cup black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6460.jpg" +"6461" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6461.jpg" +"6462" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6462.jpg" +"6463" "Is the wall red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6463.jpg" +"6464" "Is the wall white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6464.jpg" +"6465" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6465.jpg" +"6466" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6466.jpg" +"6467" "Are there two potatoes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6467.jpg" +"6468" "Are there three potatoes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6468.jpg" +"6469" "Are there five carrots in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6469.jpg" +"6470" "Are there six carrots in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6470.jpg" +"6471" "Is the broccoli green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6471.jpg" +"6472" "Is the broccoli black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6472.jpg" +"6473" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6473.jpg" +"6474" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6474.jpg" +"6475" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6475.jpg" +"6476" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6476.jpg" +"6477" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6477.jpg" +"6478" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6478.jpg" +"6479" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6479.jpg" +"6480" "Is the sun soft in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6480.jpg" +"6481" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6481.jpg" +"6482" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6482.jpg" +"6483" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6483.jpg" +"6484" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6484.jpg" +"6485" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6485.jpg" +"6486" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6486.jpg" +"6487" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6487.jpg" +"6488" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6488.jpg" +"6489" "Is the kite dancing in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6489.jpg" +"6490" "Is the kite motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6490.jpg" +"6491" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6491.jpg" +"6492" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6492.jpg" +"6493" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6493.jpg" +"6494" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6494.jpg" +"6495" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6495.jpg" +"6496" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6496.jpg" +"6497" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6497.jpg" +"6498" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6498.jpg" +"6499" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6499.jpg" +"6500" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6500.jpg" +"6501" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6501.jpg" +"6502" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6502.jpg" +"6503" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6503.jpg" +"6504" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6504.jpg" +"6505" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6505.jpg" +"6506" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6506.jpg" +"6507" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6507.jpg" +"6508" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6508.jpg" +"6509" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6509.jpg" +"6510" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6510.jpg" +"6511" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6511.jpg" +"6512" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6512.jpg" +"6513" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6513.jpg" +"6514" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6514.jpg" +"6515" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6515.jpg" +"6516" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6516.jpg" +"6517" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6517.jpg" +"6518" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6518.jpg" +"6519" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6519.jpg" +"6520" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6520.jpg" +"6521" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6521.jpg" +"6522" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6522.jpg" +"6523" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6523.jpg" +"6524" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6524.jpg" +"6525" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6525.jpg" +"6526" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6526.jpg" +"6527" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6527.jpg" +"6528" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6528.jpg" +"6529" "Are there two sanitizers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6529.jpg" +"6530" "Are there three sanitizers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6530.jpg" +"6531" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6531.jpg" +"6532" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6532.jpg" +"6533" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6533.jpg" +"6534" "Is the sink black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6534.jpg" +"6535" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6535.jpg" +"6536" "Are there three cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6536.jpg" +"6537" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6537.jpg" +"6538" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6538.jpg" +"6539" "Is the door white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6539.jpg" +"6540" "Is the door black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6540.jpg" +"6541" "Is the carpet clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6541.jpg" +"6542" "Is the carpet dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6542.jpg" +"6543" "Is the carpet clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6543.jpg" +"6544" "Is the carpet dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6544.jpg" +"6545" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6545.jpg" +"6546" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6546.jpg" +"6547" "Is the cat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6547.jpg" +"6548" "Is the cat white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6548.jpg" +"6549" "Is the broccoli ripe in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6549.jpg" +"6550" "Is the broccoli raw in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6550.jpg" +"6551" "Is the tomato red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6551.jpg" +"6552" "Is the tomato white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6552.jpg" +"6553" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6553.jpg" +"6554" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6554.jpg" +"6555" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6555.jpg" +"6556" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6556.jpg" +"6557" "Are there two trains in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6557.jpg" +"6558" "Are there three trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6558.jpg" +"6559" "Is the rail complex in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6559.jpg" +"6560" "Is the rail simple in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6560.jpg" +"6561" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6561.jpg" +"6562" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6562.jpg" +"6563" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6563.jpg" +"6564" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6564.jpg" +"6565" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6565.jpg" +"6566" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6566.jpg" +"6567" "Is there one tangerine in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6567.jpg" +"6568" "Are there two tangerines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6568.jpg" +"6569" "Is there one lemon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6569.jpg" +"6570" "Are there two lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6570.jpg" +"6571" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6571.jpg" +"6572" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6572.jpg" +"6573" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6573.jpg" +"6574" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6574.jpg" +"6575" "Is the fence old in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6575.jpg" +"6576" "Is the fence brand new in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6576.jpg" +"6577" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6577.jpg" +"6578" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6578.jpg" +"6579" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6579.jpg" +"6580" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6580.jpg" +"6581" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6581.jpg" +"6582" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6582.jpg" +"6583" "Is there one zebra in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6583.jpg" +"6584" "Are there two zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6584.jpg" +"6585" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6585.jpg" +"6586" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6586.jpg" +"6587" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6587.jpg" +"6588" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6588.jpg" +"6589" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6589.jpg" +"6590" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6590.jpg" +"6591" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6591.jpg" +"6592" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6592.jpg" +"6593" "Is the sign obvious in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6593.jpg" +"6594" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6594.jpg" +"6595" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6595.jpg" +"6596" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6596.jpg" +"6597" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6597.jpg" +"6598" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6598.jpg" +"6599" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6599.jpg" +"6600" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6600.jpg" +"6601" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6601.jpg" +"6602" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6602.jpg" +"6603" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6603.jpg" +"6604" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6604.jpg" +"6605" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6605.jpg" +"6606" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6606.jpg" +"6607" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6607.jpg" +"6608" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6608.jpg" +"6609" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6609.jpg" +"6610" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6610.jpg" +"6611" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6611.jpg" +"6612" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6612.jpg" +"6613" "Is there one duck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6613.jpg" +"6614" "Are there two ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6614.jpg" +"6615" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6615.jpg" +"6616" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6616.jpg" +"6617" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6617.jpg" +"6618" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6618.jpg" +"6619" "Is there one bottle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6619.jpg" +"6620" "Are there two bottles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6620.jpg" +"6621" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6621.jpg" +"6622" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6622.jpg" +"6623" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6623.jpg" +"6624" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6624.jpg" +"6625" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6625.jpg" +"6626" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6626.jpg" +"6627" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6627.jpg" +"6628" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6628.jpg" +"6629" "Is the grass yellowed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6629.jpg" +"6630" "Is the grass white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6630.jpg" +"6631" "Are there two elephants in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6631.jpg" +"6632" "Are there three elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6632.jpg" +"6633" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6633.jpg" +"6634" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6634.jpg" +"6635" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6635.jpg" +"6636" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6636.jpg" +"6637" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6637.jpg" +"6638" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6638.jpg" +"6639" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6639.jpg" +"6640" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6640.jpg" +"6641" "Is there one racket in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6641.jpg" +"6642" "Are there two rackets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6642.jpg" +"6643" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6643.jpg" +"6644" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6644.jpg" +"6645" "Is there one zebra in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6645.jpg" +"6646" "Are there two zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6646.jpg" +"6647" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6647.jpg" +"6648" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6648.jpg" +"6649" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6649.jpg" +"6650" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6650.jpg" +"6651" "Is the refrigerator white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6651.jpg" +"6652" "Is the refrigerator black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6652.jpg" +"6653" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6653.jpg" +"6654" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6654.jpg" +"6655" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6655.jpg" +"6656" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6656.jpg" +"6657" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6657.jpg" +"6658" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6658.jpg" +"6659" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6659.jpg" +"6660" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6660.jpg" +"6661" "Is the sea rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6661.jpg" +"6662" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6662.jpg" +"6663" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6663.jpg" +"6664" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6664.jpg" +"6665" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6665.jpg" +"6666" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6666.jpg" +"6667" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6667.jpg" +"6668" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6668.jpg" +"6669" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6669.jpg" +"6670" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6670.jpg" +"6671" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6671.jpg" +"6672" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6672.jpg" +"6673" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6673.jpg" +"6674" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6674.jpg" +"6675" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6675.jpg" +"6676" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6676.jpg" +"6677" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6677.jpg" +"6678" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6678.jpg" +"6679" "Is the sea rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6679.jpg" +"6680" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6680.jpg" +"6681" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6681.jpg" +"6682" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6682.jpg" +"6683" "Are there three men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6683.jpg" +"6684" "Are there four men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6684.jpg" +"6685" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6685.jpg" +"6686" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6686.jpg" +"6687" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6687.jpg" +"6688" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6688.jpg" +"6689" "Is there one giraffe in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6689.jpg" +"6690" "Are there two giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6690.jpg" +"6691" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6691.jpg" +"6692" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6692.jpg" +"6693" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6693.jpg" +"6694" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6694.jpg" +"6695" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6695.jpg" +"6696" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6696.jpg" +"6697" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6697.jpg" +"6698" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6698.jpg" +"6699" "Are there four giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6699.jpg" +"6700" "Are there five giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6700.jpg" +"6701" "Does the dog run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6701.jpg" +"6702" "Does the dog sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6702.jpg" +"6703" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6703.jpg" +"6704" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6704.jpg" +"6705" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6705.jpg" +"6706" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6706.jpg" +"6707" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6707.jpg" +"6708" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6708.jpg" +"6709" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6709.jpg" +"6710" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6710.jpg" +"6711" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6711.jpg" +"6712" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6712.jpg" +"6713" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6713.jpg" +"6714" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6714.jpg" +"6715" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6715.jpg" +"6716" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6716.jpg" +"6717" "Is the kite dancing in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6717.jpg" +"6718" "Is the kite motionless in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6718.jpg" +"6719" "Are there three refrigerators in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6719.jpg" +"6720" "Are there four refrigerators in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6720.jpg" +"6721" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6721.jpg" +"6722" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6722.jpg" +"6723" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6723.jpg" +"6724" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6724.jpg" +"6725" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6725.jpg" +"6726" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6726.jpg" +"6727" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6727.jpg" +"6728" "Are there five people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6728.jpg" +"6729" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6729.jpg" +"6730" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6730.jpg" +"6731" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6731.jpg" +"6732" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6732.jpg" +"6733" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6733.jpg" +"6734" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6734.jpg" +"6735" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6735.jpg" +"6736" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6736.jpg" +"6737" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6737.jpg" +"6738" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6738.jpg" +"6739" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6739.jpg" +"6740" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6740.jpg" +"6741" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6741.jpg" +"6742" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6742.jpg" +"6743" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6743.jpg" +"6744" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6744.jpg" +"6745" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6745.jpg" +"6746" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6746.jpg" +"6747" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6747.jpg" +"6748" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6748.jpg" +"6749" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6749.jpg" +"6750" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6750.jpg" +"6751" "Is the sea rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6751.jpg" +"6752" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6752.jpg" +"6753" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6753.jpg" +"6754" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6754.jpg" +"6755" "Is the person horseback riding in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6755.jpg" +"6756" "Is the person swim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6756.jpg" +"6757" "Are there two horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6757.jpg" +"6758" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6758.jpg" +"6759" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6759.jpg" +"6760" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6760.jpg" +"6761" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6761.jpg" +"6762" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6762.jpg" +"6763" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6763.jpg" +"6764" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6764.jpg" +"6765" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6765.jpg" +"6766" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6766.jpg" +"6767" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6767.jpg" +"6768" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6768.jpg" +"6769" "Are there two hats in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6769.jpg" +"6770" "Are there three hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6770.jpg" +"6771" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6771.jpg" +"6772" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6772.jpg" +"6773" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6773.jpg" +"6774" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6774.jpg" +"6775" "Are there five elephants in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6775.jpg" +"6776" "Are there six elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6776.jpg" +"6777" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6777.jpg" +"6778" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6778.jpg" +"6779" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6779.jpg" +"6780" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6780.jpg" +"6781" "Is the bath white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6781.jpg" +"6782" "Is the bath black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6782.jpg" +"6783" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6783.jpg" +"6784" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6784.jpg" +"6785" "Is there one showerpuff in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6785.jpg" +"6786" "Are there two showerpuffs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6786.jpg" +"6787" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6787.jpg" +"6788" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6788.jpg" +"6789" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6789.jpg" +"6790" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6790.jpg" +"6791" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6791.jpg" +"6792" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6792.jpg" +"6793" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6793.jpg" +"6794" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6794.jpg" +"6795" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6795.jpg" +"6796" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6796.jpg" +"6797" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6797.jpg" +"6798" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6798.jpg" +"6799" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6799.jpg" +"6800" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6800.jpg" +"6801" "Does the child lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6801.jpg" +"6802" "Does the child stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6802.jpg" +"6803" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6803.jpg" +"6804" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6804.jpg" +"6805" "Are there six cows in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6805.jpg" +"6806" "Are there eight cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6806.jpg" +"6807" "Is the grass sparse in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6807.jpg" +"6808" "Is the grass dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6808.jpg" +"6809" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6809.jpg" +"6810" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6810.jpg" +"6811" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6811.jpg" +"6812" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6812.jpg" +"6813" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6813.jpg" +"6814" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6814.jpg" +"6815" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6815.jpg" +"6816" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6816.jpg" +"6817" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6817.jpg" +"6818" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6818.jpg" +"6819" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6819.jpg" +"6820" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6820.jpg" +"6821" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6821.jpg" +"6822" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6822.jpg" +"6823" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6823.jpg" +"6824" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6824.jpg" +"6825" "Is there one frisbee in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6825.jpg" +"6826" "Are there two frisbees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6826.jpg" +"6827" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6827.jpg" +"6828" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6828.jpg" +"6829" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6829.jpg" +"6830" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6830.jpg" +"6831" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6831.jpg" +"6832" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6832.jpg" +"6833" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6833.jpg" +"6834" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6834.jpg" +"6835" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6835.jpg" +"6836" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6836.jpg" +"6837" "Is there one core in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6837.jpg" +"6838" "Are there two cores in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6838.jpg" +"6839" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6839.jpg" +"6840" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6840.jpg" +"6841" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6841.jpg" +"6842" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6842.jpg" +"6843" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6843.jpg" +"6844" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6844.jpg" +"6845" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6845.jpg" +"6846" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6846.jpg" +"6847" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6847.jpg" +"6848" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6848.jpg" +"6849" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6849.jpg" +"6850" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6850.jpg" +"6851" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6851.jpg" +"6852" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6852.jpg" +"6853" "Are there two giraffes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6853.jpg" +"6854" "Are there three giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6854.jpg" +"6855" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6855.jpg" +"6856" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6856.jpg" +"6857" "Are there two glasses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6857.jpg" +"6858" "Are there five glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6858.jpg" +"6859" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6859.jpg" +"6860" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6860.jpg" +"6861" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6861.jpg" +"6862" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6862.jpg" +"6863" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6863.jpg" +"6864" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6864.jpg" +"6865" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6865.jpg" +"6866" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6866.jpg" +"6867" "Are there three horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6867.jpg" +"6868" "Are there four horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6868.jpg" +"6869" "Is the sky red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6869.jpg" +"6870" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6870.jpg" +"6871" "Is the sun round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6871.jpg" +"6872" "Is the sun square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6872.jpg" +"6873" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6873.jpg" +"6874" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6874.jpg" +"6875" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6875.jpg" +"6876" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6876.jpg" +"6877" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6877.jpg" +"6878" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6878.jpg" +"6879" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6879.jpg" +"6880" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6880.jpg" +"6881" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6881.jpg" +"6882" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6882.jpg" +"6883" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6883.jpg" +"6884" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6884.jpg" +"6885" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6885.jpg" +"6886" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6886.jpg" +"6887" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6887.jpg" +"6888" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6888.jpg" +"6889" "Are there two zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6889.jpg" +"6890" "Are there three zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6890.jpg" +"6891" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6891.jpg" +"6892" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6892.jpg" +"6893" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6893.jpg" +"6894" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6894.jpg" +"6895" "Is there one giraffe in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6895.jpg" +"6896" "Are there two giraffes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6896.jpg" +"6897" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6897.jpg" +"6898" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6898.jpg" +"6899" "Is there one cake in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6899.jpg" +"6900" "Are there two cakes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6900.jpg" +"6901" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6901.jpg" +"6902" "Are there two knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6902.jpg" +"6903" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6903.jpg" +"6904" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6904.jpg" +"6905" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6905.jpg" +"6906" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6906.jpg" +"6907" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6907.jpg" +"6908" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6908.jpg" +"6909" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6909.jpg" +"6910" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6910.jpg" +"6911" "Does the child jump in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6911.jpg" +"6912" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6912.jpg" +"6913" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6913.jpg" +"6914" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6914.jpg" +"6915" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6915.jpg" +"6916" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6916.jpg" +"6917" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6917.jpg" +"6918" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6918.jpg" +"6919" "Is there one panda in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6919.jpg" +"6920" "Are there two pandas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6920.jpg" +"6921" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6921.jpg" +"6922" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6922.jpg" +"6923" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6923.jpg" +"6924" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6924.jpg" +"6925" "Is the orange separated in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6925.jpg" +"6926" "Is the orange complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6926.jpg" +"6927" "Is the lemon yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6927.jpg" +"6928" "Is the lemon black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6928.jpg" +"6929" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6929.jpg" +"6930" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6930.jpg" +"6931" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6931.jpg" +"6932" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6932.jpg" +"6933" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6933.jpg" +"6934" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6934.jpg" +"6935" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6935.jpg" +"6936" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6936.jpg" +"6937" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6937.jpg" +"6938" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6938.jpg" +"6939" "Is there one goose in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6939.jpg" +"6940" "Are there two geese in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6940.jpg" +"6941" "Is the pizza round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6941.jpg" +"6942" "Is the pizza square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6942.jpg" +"6943" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6943.jpg" +"6944" "Is the plate blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6944.jpg" +"6945" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6945.jpg" +"6946" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6946.jpg" +"6947" "Are there five books in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6947.jpg" +"6948" "Are there six books in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6948.jpg" +"6949" "Is there one microwave in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6949.jpg" +"6950" "Are there two microwaves in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6950.jpg" +"6951" "Is there one bottle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6951.jpg" +"6952" "Are there two bottles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6952.jpg" +"6953" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6953.jpg" +"6954" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6954.jpg" +"6955" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6955.jpg" +"6956" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6956.jpg" +"6957" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6957.jpg" +"6958" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6958.jpg" +"6959" "Is the hydrant yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6959.jpg" +"6960" "Is the hydrant red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6960.jpg" +"6961" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6961.jpg" +"6962" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6962.jpg" +"6963" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6963.jpg" +"6964" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6964.jpg" +"6965" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6965.jpg" +"6966" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6966.jpg" +"6967" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6967.jpg" +"6968" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6968.jpg" +"6969" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6969.jpg" +"6970" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6970.jpg" +"6971" "Is there one elephant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6971.jpg" +"6972" "Are there two elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6972.jpg" +"6973" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6973.jpg" +"6974" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6974.jpg" +"6975" "Is there one vase in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6975.jpg" +"6976" "Are there two vases in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6976.jpg" +"6977" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6977.jpg" +"6978" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6978.jpg" +"6979" "Is the apple green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6979.jpg" +"6980" "Is the apple red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6980.jpg" +"6981" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6981.jpg" +"6982" "Is the forest wither in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6982.jpg" +"6983" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6983.jpg" +"6984" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6984.jpg" +"6985" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6985.jpg" +"6986" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6986.jpg" +"6987" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6987.jpg" +"6988" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6988.jpg" +"6989" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6989.jpg" +"6990" "Are there two toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6990.jpg" +"6991" "Is the tissue white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6991.jpg" +"6992" "Is the tissue black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6992.jpg" +"6993" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6993.jpg" +"6994" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6994.jpg" +"6995" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6995.jpg" +"6996" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6996.jpg" +"6997" "Is the frisbee pink in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6997.jpg" +"6998" "Is the frisbee yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6998.jpg" +"6999" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/6999.jpg" +"7000" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7000.jpg" +"7001" "Are there three parasails in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7001.jpg" +"7002" "Are there four parasails in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7002.jpg" +"7003" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7003.jpg" +"7004" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7004.jpg" +"7005" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7005.jpg" +"7006" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7006.jpg" +"7007" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7007.jpg" +"7008" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7008.jpg" +"7009" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7009.jpg" +"7010" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7010.jpg" +"7011" "Are there five elephants in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7011.jpg" +"7012" "Are there six elephants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7012.jpg" +"7013" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7013.jpg" +"7014" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7014.jpg" +"7015" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7015.jpg" +"7016" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7016.jpg" +"7017" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7017.jpg" +"7018" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7018.jpg" +"7019" "Does the man surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7019.jpg" +"7020" "Does the man swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7020.jpg" +"7021" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7021.jpg" +"7022" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7022.jpg" +"7023" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7023.jpg" +"7024" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7024.jpg" +"7025" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7025.jpg" +"7026" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7026.jpg" +"7027" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7027.jpg" +"7028" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7028.jpg" +"7029" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7029.jpg" +"7030" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7030.jpg" +"7031" "Is there one bread in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7031.jpg" +"7032" "Are there two breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7032.jpg" +"7033" "Is the tissue yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7033.jpg" +"7034" "Is the tissue blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7034.jpg" +"7035" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7035.jpg" +"7036" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7036.jpg" +"7037" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7037.jpg" +"7038" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7038.jpg" +"7039" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7039.jpg" +"7040" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7040.jpg" +"7041" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7041.jpg" +"7042" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7042.jpg" +"7043" "Is there one kite in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7043.jpg" +"7044" "Are there two kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7044.jpg" +"7045" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7045.jpg" +"7046" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7046.jpg" +"7047" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7047.jpg" +"7048" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7048.jpg" +"7049" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7049.jpg" +"7050" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7050.jpg" +"7051" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7051.jpg" +"7052" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7052.jpg" +"7053" "Is the lake sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7053.jpg" +"7054" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7054.jpg" +"7055" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7055.jpg" +"7056" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7056.jpg" +"7057" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7057.jpg" +"7058" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7058.jpg" +"7059" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7059.jpg" +"7060" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7060.jpg" +"7061" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7061.jpg" +"7062" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7062.jpg" +"7063" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7063.jpg" +"7064" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7064.jpg" +"7065" "Are there three wires in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7065.jpg" +"7066" "Are there four wires in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7066.jpg" +"7067" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7067.jpg" +"7068" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7068.jpg" +"7069" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7069.jpg" +"7070" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7070.jpg" +"7071" "Is the hat black in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7071.jpg" +"7072" "Is the hat white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7072.jpg" +"7073" "Is there one pizza in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7073.jpg" +"7074" "Are there two pizzas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7074.jpg" +"7075" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7075.jpg" +"7076" "Is the plate blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7076.jpg" +"7077" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7077.jpg" +"7078" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7078.jpg" +"7079" "Is there one tie in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7079.jpg" +"7080" "Are there two ties in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7080.jpg" +"7081" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7081.jpg" +"7082" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7082.jpg" +"7083" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7083.jpg" +"7084" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7084.jpg" +"7085" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7085.jpg" +"7086" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7086.jpg" +"7087" "Does the child stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7087.jpg" +"7088" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7088.jpg" +"7089" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7089.jpg" +"7090" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7090.jpg" +"7091" "Is there one bat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7091.jpg" +"7092" "Are there two bats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7092.jpg" +"7093" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7093.jpg" +"7094" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7094.jpg" +"7095" "Are there seven controllers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7095.jpg" +"7096" "Are there eight controllers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7096.jpg" +"7097" "Are there two sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7097.jpg" +"7098" "Are there three sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7098.jpg" +"7099" "Does the grass lush in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7099.jpg" +"7100" "Does the grass yellowed in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7100.jpg" +"7101" "Are there two zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7101.jpg" +"7102" "Are there three zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7102.jpg" +"7103" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7103.jpg" +"7104" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7104.jpg" +"7105" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7105.jpg" +"7106" "Is the tree yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7106.jpg" +"7107" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7107.jpg" +"7108" "Is the sky azure in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7108.jpg" +"7109" "Is the lamp open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7109.jpg" +"7110" "Is the lamp close in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7110.jpg" +"7111" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7111.jpg" +"7112" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7112.jpg" +"7113" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7113.jpg" +"7114" "Are there three pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7114.jpg" +"7115" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7115.jpg" +"7116" "Is the laptop close in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7116.jpg" +"7117" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7117.jpg" +"7118" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7118.jpg" +"7119" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7119.jpg" +"7120" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7120.jpg" +"7121" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7121.jpg" +"7122" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7122.jpg" +"7123" "Is the sky deep blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7123.jpg" +"7124" "Is the sky pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7124.jpg" +"7125" "Is the cloud pure white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7125.jpg" +"7126" "Is the cloud dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7126.jpg" +"7127" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7127.jpg" +"7128" "Is the sea turbulent in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7128.jpg" +"7129" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7129.jpg" +"7130" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7130.jpg" +"7131" "Does the person slide in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7131.jpg" +"7132" "Does the person lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7132.jpg" +"7133" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7133.jpg" +"7134" "Is the cloud gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7134.jpg" +"7135" "Are there two snowboards in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7135.jpg" +"7136" "Are there three snowboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7136.jpg" +"7137" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7137.jpg" +"7138" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7138.jpg" +"7139" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7139.jpg" +"7140" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7140.jpg" +"7141" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7141.jpg" +"7142" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7142.jpg" +"7143" "Is the lake calm seas in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7143.jpg" +"7144" "Is the lake stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7144.jpg" +"7145" "Is the sky azure in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7145.jpg" +"7146" "Is the sky gray in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7146.jpg" +"7147" "Is the cloud pristine in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7147.jpg" +"7148" "Is the cloud filthy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7148.jpg" +"7149" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7149.jpg" +"7150" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7150.jpg" +"7151" "Is the man sit in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7151.jpg" +"7152" "Is the man stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7152.jpg" +"7153" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7153.jpg" +"7154" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7154.jpg" +"7155" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7155.jpg" +"7156" "Is the grass lush green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7156.jpg" +"7157" "Does the bird stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7157.jpg" +"7158" "Does the bird fly in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7158.jpg" +"7159" "Is the grass lush green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7159.jpg" +"7160" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7160.jpg" +"7161" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7161.jpg" +"7162" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7162.jpg" +"7163" "Are there three birds in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7163.jpg" +"7164" "Are there four birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7164.jpg" +"7165" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7165.jpg" +"7166" "Is the grass yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7166.jpg" +"7167" "Does the woman walking in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7167.jpg" +"7168" "Does the woman lie down in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7168.jpg" +"7169" "Does the dog walking in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7169.jpg" +"7170" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7170.jpg" +"7171" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7171.jpg" +"7172" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7172.jpg" +"7173" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7173.jpg" +"7174" "Is the grass rare in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7174.jpg" +"7175" "Is the forest loose in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7175.jpg" +"7176" "Is the forest dense in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7176.jpg" +"7177" "Is the sky blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7177.jpg" +"7178" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7178.jpg" +"7179" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7179.jpg" +"7180" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7180.jpg" +"7181" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7181.jpg" +"7182" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7182.jpg" +"7183" "Are there five chairs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7183.jpg" +"7184" "Are there six chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7184.jpg" +"7185" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7185.jpg" +"7186" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7186.jpg" +"7187" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7187.jpg" +"7188" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7188.jpg" +"7189" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7189.jpg" +"7190" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7190.jpg" +"7191" "Is there one pizza in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7191.jpg" +"7192" "Are there two pizzas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7192.jpg" +"7193" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7193.jpg" +"7194" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7194.jpg" +"7195" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7195.jpg" +"7196" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7196.jpg" +"7197" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7197.jpg" +"7198" "Is the snow blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7198.jpg" +"7199" "Are there two motorbikes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7199.jpg" +"7200" "Are there three motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7200.jpg" +"7201" "Are there two men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7201.jpg" +"7202" "Are there three men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7202.jpg" +"7203" "Are there two glasses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7203.jpg" +"7204" "Are there three glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7204.jpg" +"7205" "Are there two hats in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7205.jpg" +"7206" "Are there three hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7206.jpg" +"7207" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7207.jpg" +"7208" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7208.jpg" +"7209" "Is the banana yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7209.jpg" +"7210" "Is the banana white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7210.jpg" +"7211" "Is the apple red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7211.jpg" +"7212" "Is the apple blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7212.jpg" +"7213" "Is the orange orange in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7213.jpg" +"7214" "Is the orange pink in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7214.jpg" +"7215" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7215.jpg" +"7216" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7216.jpg" +"7217" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7217.jpg" +"7218" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7218.jpg" +"7219" "Are there two trees in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7219.jpg" +"7220" "Are there three trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7220.jpg" +"7221" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7221.jpg" +"7222" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7222.jpg" +"7223" "Does the giraffe stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7223.jpg" +"7224" "Does the giraffe sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7224.jpg" +"7225" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7225.jpg" +"7226" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7226.jpg" +"7227" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7227.jpg" +"7228" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7228.jpg" +"7229" "Is there one motorbike in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7229.jpg" +"7230" "Are there two motorbikes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7230.jpg" +"7231" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7231.jpg" +"7232" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7232.jpg" +"7233" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7233.jpg" +"7234" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7234.jpg" +"7235" "Is the tangerine orange in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7235.jpg" +"7236" "Is the tangerine white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7236.jpg" +"7237" "Is the leave green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7237.jpg" +"7238" "Is the leave black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7238.jpg" +"7239" "Is the mouse white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7239.jpg" +"7240" "Is the mouse black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7240.jpg" +"7241" "Is there one mousepad in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7241.jpg" +"7242" "Are there two mousepads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7242.jpg" +"7243" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7243.jpg" +"7244" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7244.jpg" +"7245" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7245.jpg" +"7246" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7246.jpg" +"7247" "Is the tinfoil silver in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7247.jpg" +"7248" "Is the tinfoil black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7248.jpg" +"7249" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7249.jpg" +"7250" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7250.jpg" +"7251" "Is there one bread in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7251.jpg" +"7252" "Are there two breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7252.jpg" +"7253" "Is there one pear in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7253.jpg" +"7254" "Are there two pears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7254.jpg" +"7255" "Is the sofa comfortable in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7255.jpg" +"7256" "Is the sofa uncomfortable in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7256.jpg" +"7257" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7257.jpg" +"7258" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7258.jpg" +"7259" "Are there two toys in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7259.jpg" +"7260" "Are there three toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7260.jpg" +"7261" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7261.jpg" +"7262" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7262.jpg" +"7263" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7263.jpg" +"7264" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7264.jpg" +"7265" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7265.jpg" +"7266" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7266.jpg" +"7267" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7267.jpg" +"7268" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7268.jpg" +"7269" "Is the cat sit in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7269.jpg" +"7270" "Is the cat lie prone in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7270.jpg" +"7271" "Is the television open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7271.jpg" +"7272" "Is the television closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7272.jpg" +"7273" "Is there one cable in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7273.jpg" +"7274" "Are there two cables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7274.jpg" +"7275" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7275.jpg" +"7276" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7276.jpg" +"7277" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7277.jpg" +"7278" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7278.jpg" +"7279" "Are there two cats in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7279.jpg" +"7280" "Are there three cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7280.jpg" +"7281" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7281.jpg" +"7282" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7282.jpg" +"7283" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7283.jpg" +"7284" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7284.jpg" +"7285" "Is there one apple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7285.jpg" +"7286" "Are there two apples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7286.jpg" +"7287" "Is there one knife in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7287.jpg" +"7288" "Are there two knives in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7288.jpg" +"7289" "Is there one fork in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7289.jpg" +"7290" "Are there two forks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7290.jpg" +"7291" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7291.jpg" +"7292" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7292.jpg" +"7293" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7293.jpg" +"7294" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7294.jpg" +"7295" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7295.jpg" +"7296" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7296.jpg" +"7297" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7297.jpg" +"7298" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7298.jpg" +"7299" "Are there three men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7299.jpg" +"7300" "Are there four men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7300.jpg" +"7301" "Is there one football in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7301.jpg" +"7302" "Are there two footballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7302.jpg" +"7303" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7303.jpg" +"7304" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7304.jpg" +"7305" "Is there one clock in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7305.jpg" +"7306" "Are there two clocks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7306.jpg" +"7307" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7307.jpg" +"7308" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7308.jpg" +"7309" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7309.jpg" +"7310" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7310.jpg" +"7311" "Is there one umbrella in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7311.jpg" +"7312" "Are there two umbrellas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7312.jpg" +"7313" "Is the wall smooth in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7313.jpg" +"7314" "Is the wall rough in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7314.jpg" +"7315" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7315.jpg" +"7316" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7316.jpg" +"7317" "Is the cushion white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7317.jpg" +"7318" "Is the cushion black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7318.jpg" +"7319" "Is there one toilet in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7319.jpg" +"7320" "Are there two toilets in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7320.jpg" +"7321" "Is there one towel in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7321.jpg" +"7322" "Are there two towels in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7322.jpg" +"7323" "Is the sink white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7323.jpg" +"7324" "Is the sink blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7324.jpg" +"7325" "Is the tap closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7325.jpg" +"7326" "Is the tap open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7326.jpg" +"7327" "Is the banana yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7327.jpg" +"7328" "Is the banana white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7328.jpg" +"7329" "Is there one sticker in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7329.jpg" +"7330" "Are there two stickers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7330.jpg" +"7331" "Is the tangerine orange in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7331.jpg" +"7332" "Is the tangerine green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7332.jpg" +"7333" "Is the apple yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7333.jpg" +"7334" "Is the apple black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7334.jpg" +"7335" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7335.jpg" +"7336" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7336.jpg" +"7337" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7337.jpg" +"7338" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7338.jpg" +"7339" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7339.jpg" +"7340" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7340.jpg" +"7341" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7341.jpg" +"7342" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7342.jpg" +"7343" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7343.jpg" +"7344" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7344.jpg" +"7345" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7345.jpg" +"7346" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7346.jpg" +"7347" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7347.jpg" +"7348" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7348.jpg" +"7349" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7349.jpg" +"7350" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7350.jpg" +"7351" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7351.jpg" +"7352" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7352.jpg" +"7353" "Does the person stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7353.jpg" +"7354" "Does the person sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7354.jpg" +"7355" "Are there three kites in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7355.jpg" +"7356" "Are there four kites in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7356.jpg" +"7357" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7357.jpg" +"7358" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7358.jpg" +"7359" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7359.jpg" +"7360" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7360.jpg" +"7361" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7361.jpg" +"7362" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7362.jpg" +"7363" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7363.jpg" +"7364" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7364.jpg" +"7365" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7365.jpg" +"7366" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7366.jpg" +"7367" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7367.jpg" +"7368" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7368.jpg" +"7369" "Does the dog stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7369.jpg" +"7370" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7370.jpg" +"7371" "Is there one tennis in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7371.jpg" +"7372" "Are there two tenni in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7372.jpg" +"7373" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7373.jpg" +"7374" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7374.jpg" +"7375" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7375.jpg" +"7376" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7376.jpg" +"7377" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7377.jpg" +"7378" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7378.jpg" +"7379" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7379.jpg" +"7380" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7380.jpg" +"7381" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7381.jpg" +"7382" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7382.jpg" +"7383" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7383.jpg" +"7384" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7384.jpg" +"7385" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7385.jpg" +"7386" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7386.jpg" +"7387" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7387.jpg" +"7388" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7388.jpg" +"7389" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7389.jpg" +"7390" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7390.jpg" +"7391" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7391.jpg" +"7392" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7392.jpg" +"7393" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7393.jpg" +"7394" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7394.jpg" +"7395" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7395.jpg" +"7396" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7396.jpg" +"7397" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7397.jpg" +"7398" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7398.jpg" +"7399" "Is there one parasail in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7399.jpg" +"7400" "Are there two parasails in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7400.jpg" +"7401" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7401.jpg" +"7402" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7402.jpg" +"7403" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7403.jpg" +"7404" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7404.jpg" +"7405" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7405.jpg" +"7406" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7406.jpg" +"7407" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7407.jpg" +"7408" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7408.jpg" +"7409" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7409.jpg" +"7410" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7410.jpg" +"7411" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7411.jpg" +"7412" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7412.jpg" +"7413" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7413.jpg" +"7414" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7414.jpg" +"7415" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7415.jpg" +"7416" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7416.jpg" +"7417" "Does the man surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7417.jpg" +"7418" "Does the man swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7418.jpg" +"7419" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7419.jpg" +"7420" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7420.jpg" +"7421" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7421.jpg" +"7422" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7422.jpg" +"7423" "Is there one bear in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7423.jpg" +"7424" "Are there two bears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7424.jpg" +"7425" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7425.jpg" +"7426" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7426.jpg" +"7427" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7427.jpg" +"7428" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7428.jpg" +"7429" "Is the tree green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7429.jpg" +"7430" "Is the tree blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7430.jpg" +"7431" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7431.jpg" +"7432" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7432.jpg" +"7433" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7433.jpg" +"7434" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7434.jpg" +"7435" "Is there one hydrant in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7435.jpg" +"7436" "Are there two hydrants in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7436.jpg" +"7437" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7437.jpg" +"7438" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7438.jpg" +"7439" "Is the sky overcast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7439.jpg" +"7440" "Is the sky bright in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7440.jpg" +"7441" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7441.jpg" +"7442" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7442.jpg" +"7443" "Are there two ships in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7443.jpg" +"7444" "Are there three ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7444.jpg" +"7445" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7445.jpg" +"7446" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7446.jpg" +"7447" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7447.jpg" +"7448" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7448.jpg" +"7449" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7449.jpg" +"7450" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7450.jpg" +"7451" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7451.jpg" +"7452" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7452.jpg" +"7453" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7453.jpg" +"7454" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7454.jpg" +"7455" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7455.jpg" +"7456" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7456.jpg" +"7457" "Is there one box in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7457.jpg" +"7458" "Are there two boxes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7458.jpg" +"7459" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7459.jpg" +"7460" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7460.jpg" +"7461" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7461.jpg" +"7462" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7462.jpg" +"7463" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7463.jpg" +"7464" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7464.jpg" +"7465" "Is there one bench in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7465.jpg" +"7466" "Are there two benches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7466.jpg" +"7467" "Is the carpet clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7467.jpg" +"7468" "Is the carpet dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7468.jpg" +"7469" "Is there one tennis in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7469.jpg" +"7470" "Are there two tenni in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7470.jpg" +"7471" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7471.jpg" +"7472" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7472.jpg" +"7473" "Is there one bottle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7473.jpg" +"7474" "Are there two bottles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7474.jpg" +"7475" "Are there two breads in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7475.jpg" +"7476" "Are there three breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7476.jpg" +"7477" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7477.jpg" +"7478" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7478.jpg" +"7479" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7479.jpg" +"7480" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7480.jpg" +"7481" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7481.jpg" +"7482" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7482.jpg" +"7483" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7483.jpg" +"7484" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7484.jpg" +"7485" "Is there one train in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7485.jpg" +"7486" "Are there two trains in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7486.jpg" +"7487" "Is the tree withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7487.jpg" +"7488" "Is the tree lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7488.jpg" +"7489" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7489.jpg" +"7490" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7490.jpg" +"7491" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7491.jpg" +"7492" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7492.jpg" +"7493" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7493.jpg" +"7494" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7494.jpg" +"7495" "Are there four zebras in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7495.jpg" +"7496" "Are there five zebras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7496.jpg" +"7497" "Is there one toothbrush in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7497.jpg" +"7498" "Are there two toothbrushes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7498.jpg" +"7499" "Is there one toy in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7499.jpg" +"7500" "Are there two toys in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7500.jpg" +"7501" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7501.jpg" +"7502" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7502.jpg" +"7503" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7503.jpg" +"7504" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7504.jpg" +"7505" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7505.jpg" +"7506" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7506.jpg" +"7507" "Are there two horses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7507.jpg" +"7508" "Are there three horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7508.jpg" +"7509" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7509.jpg" +"7510" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7510.jpg" +"7511" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7511.jpg" +"7512" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7512.jpg" +"7513" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7513.jpg" +"7514" "Are there two tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7514.jpg" +"7515" "Are there three chairs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7515.jpg" +"7516" "Are there four chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7516.jpg" +"7517" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7517.jpg" +"7518" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7518.jpg" +"7519" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7519.jpg" +"7520" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7520.jpg" +"7521" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7521.jpg" +"7522" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7522.jpg" +"7523" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7523.jpg" +"7524" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7524.jpg" +"7525" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7525.jpg" +"7526" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7526.jpg" +"7527" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7527.jpg" +"7528" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7528.jpg" +"7529" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7529.jpg" +"7530" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7530.jpg" +"7531" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7531.jpg" +"7532" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7532.jpg" +"7533" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7533.jpg" +"7534" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7534.jpg" +"7535" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7535.jpg" +"7536" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7536.jpg" +"7537" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7537.jpg" +"7538" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7538.jpg" +"7539" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7539.jpg" +"7540" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7540.jpg" +"7541" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7541.jpg" +"7542" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7542.jpg" +"7543" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7543.jpg" +"7544" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7544.jpg" +"7545" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7545.jpg" +"7546" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7546.jpg" +"7547" "Is there one glass in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7547.jpg" +"7548" "Are there two glasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7548.jpg" +"7549" "Is the book open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7549.jpg" +"7550" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7550.jpg" +"7551" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7551.jpg" +"7552" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7552.jpg" +"7553" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7553.jpg" +"7554" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7554.jpg" +"7555" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7555.jpg" +"7556" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7556.jpg" +"7557" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7557.jpg" +"7558" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7558.jpg" +"7559" "Is there one eagle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7559.jpg" +"7560" "Are there two eagles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7560.jpg" +"7561" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7561.jpg" +"7562" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7562.jpg" +"7563" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7563.jpg" +"7564" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7564.jpg" +"7565" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7565.jpg" +"7566" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7566.jpg" +"7567" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7567.jpg" +"7568" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7568.jpg" +"7569" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7569.jpg" +"7570" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7570.jpg" +"7571" "Does the person ride a bike in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7571.jpg" +"7572" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7572.jpg" +"7573" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7573.jpg" +"7574" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7574.jpg" +"7575" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7575.jpg" +"7576" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7576.jpg" +"7577" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7577.jpg" +"7578" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7578.jpg" +"7579" "Is there one tie in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7579.jpg" +"7580" "Are there two ties in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7580.jpg" +"7581" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7581.jpg" +"7582" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7582.jpg" +"7583" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7583.jpg" +"7584" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7584.jpg" +"7585" "Is the sand vast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7585.jpg" +"7586" "Is the sand small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7586.jpg" +"7587" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7587.jpg" +"7588" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7588.jpg" +"7589" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7589.jpg" +"7590" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7590.jpg" +"7591" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7591.jpg" +"7592" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7592.jpg" +"7593" "Is the woman lie down in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7593.jpg" +"7594" "Is the woman stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7594.jpg" +"7595" "Is the star shiny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7595.jpg" +"7596" "Is the star dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7596.jpg" +"7597" "Is the sky beautiful in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7597.jpg" +"7598" "Is the sky ugly in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7598.jpg" +"7599" "Is the lake calm waters in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7599.jpg" +"7600" "Is the lake rolling waves in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7600.jpg" +"7601" "Is the sky overcast in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7601.jpg" +"7602" "Is the sky bright in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7602.jpg" +"7603" "Is the moon round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7603.jpg" +"7604" "Is the moon curved in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7604.jpg" +"7605" "Is the sun round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7605.jpg" +"7606" "Is the sun square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7606.jpg" +"7607" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7607.jpg" +"7608" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7608.jpg" +"7609" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7609.jpg" +"7610" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7610.jpg" +"7611" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7611.jpg" +"7612" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7612.jpg" +"7613" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7613.jpg" +"7614" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7614.jpg" +"7615" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7615.jpg" +"7616" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7616.jpg" +"7617" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7617.jpg" +"7618" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7618.jpg" +"7619" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7619.jpg" +"7620" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7620.jpg" +"7621" "Is there one cow in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7621.jpg" +"7622" "Are there two cows in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7622.jpg" +"7623" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7623.jpg" +"7624" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7624.jpg" +"7625" "Is the ground uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7625.jpg" +"7626" "Is the ground flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7626.jpg" +"7627" "Are there three sheep in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7627.jpg" +"7628" "Are there four sheep in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7628.jpg" +"7629" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7629.jpg" +"7630" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7630.jpg" +"7631" "Is the grape purple in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7631.jpg" +"7632" "Is the grape white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7632.jpg" +"7633" "Are there two wineglasses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7633.jpg" +"7634" "Are there three wineglasses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7634.jpg" +"7635" "Is there one wine in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7635.jpg" +"7636" "Are there two wines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7636.jpg" +"7637" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7637.jpg" +"7638" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7638.jpg" +"7639" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7639.jpg" +"7640" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7640.jpg" +"7641" "Does the child run in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7641.jpg" +"7642" "Does the child sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7642.jpg" +"7643" "Is the beach uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7643.jpg" +"7644" "Is the beach flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7644.jpg" +"7645" "Is there one pineapple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7645.jpg" +"7646" "Are there two pineapples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7646.jpg" +"7647" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7647.jpg" +"7648" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7648.jpg" +"7649" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7649.jpg" +"7650" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7650.jpg" +"7651" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7651.jpg" +"7652" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7652.jpg" +"7653" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7653.jpg" +"7654" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7654.jpg" +"7655" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7655.jpg" +"7656" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7656.jpg" +"7657" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7657.jpg" +"7658" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7658.jpg" +"7659" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7659.jpg" +"7660" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7660.jpg" +"7661" "Is there one tortoise in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7661.jpg" +"7662" "Are there two tortoises in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7662.jpg" +"7663" "Is the book open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7663.jpg" +"7664" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7664.jpg" +"7665" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7665.jpg" +"7666" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7666.jpg" +"7667" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7667.jpg" +"7668" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7668.jpg" +"7669" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7669.jpg" +"7670" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7670.jpg" +"7671" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7671.jpg" +"7672" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7672.jpg" +"7673" "Are there five houses in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7673.jpg" +"7674" "Are there six houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7674.jpg" +"7675" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7675.jpg" +"7676" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7676.jpg" +"7677" "Are there two chairs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7677.jpg" +"7678" "Are there three chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7678.jpg" +"7679" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7679.jpg" +"7680" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7680.jpg" +"7681" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7681.jpg" +"7682" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7682.jpg" +"7683" "Is there one bowl in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7683.jpg" +"7684" "Are there two bowls in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7684.jpg" +"7685" "Is the table neat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7685.jpg" +"7686" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7686.jpg" +"7687" "Is the chair 2 in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7687.jpg" +"7688" "Is the chair 3 in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7688.jpg" +"7689" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7689.jpg" +"7690" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7690.jpg" +"7691" "Is the refrigerator white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7691.jpg" +"7692" "Is the refrigerator black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7692.jpg" +"7693" "Are there two colas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7693.jpg" +"7694" "Are there three colas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7694.jpg" +"7695" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7695.jpg" +"7696" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7696.jpg" +"7697" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7697.jpg" +"7698" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7698.jpg" +"7699" "Is there one plane in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7699.jpg" +"7700" "Are there two planes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7700.jpg" +"7701" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7701.jpg" +"7702" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7702.jpg" +"7703" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7703.jpg" +"7704" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7704.jpg" +"7705" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7705.jpg" +"7706" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7706.jpg" +"7707" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7707.jpg" +"7708" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7708.jpg" +"7709" "Is the sun round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7709.jpg" +"7710" "Is the sun square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7710.jpg" +"7711" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7711.jpg" +"7712" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7712.jpg" +"7713" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7713.jpg" +"7714" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7714.jpg" +"7715" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7715.jpg" +"7716" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7716.jpg" +"7717" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7717.jpg" +"7718" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7718.jpg" +"7719" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7719.jpg" +"7720" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7720.jpg" +"7721" "Is there one tent in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7721.jpg" +"7722" "Are there two tents in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7722.jpg" +"7723" "Is the sea deep blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7723.jpg" +"7724" "Is the sea red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7724.jpg" +"7725" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7725.jpg" +"7726" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7726.jpg" +"7727" "Does the person swim in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7727.jpg" +"7728" "Does the person row a boat in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7728.jpg" +"7729" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7729.jpg" +"7730" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7730.jpg" +"7731" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7731.jpg" +"7732" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7732.jpg" +"7733" "Does the man sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7733.jpg" +"7734" "Does the man stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7734.jpg" +"7735" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7735.jpg" +"7736" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7736.jpg" +"7737" "Is the pad open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7737.jpg" +"7738" "Is the pad closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7738.jpg" +"7739" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7739.jpg" +"7740" "Are there two pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7740.jpg" +"7741" "Is there one watch in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7741.jpg" +"7742" "Are there two watches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7742.jpg" +"7743" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7743.jpg" +"7744" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7744.jpg" +"7745" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7745.jpg" +"7746" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7746.jpg" +"7747" "Is the guardrail sturdy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7747.jpg" +"7748" "Is the guardrail fragile in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7748.jpg" +"7749" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7749.jpg" +"7750" "Does the woman run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7750.jpg" +"7751" "Is there one bicycle in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7751.jpg" +"7752" "Are there two bicycles in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7752.jpg" +"7753" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7753.jpg" +"7754" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7754.jpg" +"7755" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7755.jpg" +"7756" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7756.jpg" +"7757" "Is the lake clear in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7757.jpg" +"7758" "Is the lake murky in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7758.jpg" +"7759" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7759.jpg" +"7760" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7760.jpg" +"7761" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7761.jpg" +"7762" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7762.jpg" +"7763" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7763.jpg" +"7764" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7764.jpg" +"7765" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7765.jpg" +"7766" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7766.jpg" +"7767" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7767.jpg" +"7768" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7768.jpg" +"7769" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7769.jpg" +"7770" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7770.jpg" +"7771" "Is there one horse in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7771.jpg" +"7772" "Are there two horses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7772.jpg" +"7773" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7773.jpg" +"7774" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7774.jpg" +"7775" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7775.jpg" +"7776" "Is the cloud red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7776.jpg" +"7777" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7777.jpg" +"7778" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7778.jpg" +"7779" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7779.jpg" +"7780" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7780.jpg" +"7781" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7781.jpg" +"7782" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7782.jpg" +"7783" "Is the umbrella open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7783.jpg" +"7784" "Is the umbrella closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7784.jpg" +"7785" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7785.jpg" +"7786" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7786.jpg" +"7787" "Are there two lounges in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7787.jpg" +"7788" "Are there three lounges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7788.jpg" +"7789" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7789.jpg" +"7790" "Are there two tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7790.jpg" +"7791" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7791.jpg" +"7792" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7792.jpg" +"7793" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7793.jpg" +"7794" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7794.jpg" +"7795" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7795.jpg" +"7796" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7796.jpg" +"7797" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7797.jpg" +"7798" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7798.jpg" +"7799" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7799.jpg" +"7800" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7800.jpg" +"7801" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7801.jpg" +"7802" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7802.jpg" +"7803" "Are there three ships in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7803.jpg" +"7804" "Are there four ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7804.jpg" +"7805" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7805.jpg" +"7806" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7806.jpg" +"7807" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7807.jpg" +"7808" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7808.jpg" +"7809" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7809.jpg" +"7810" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7810.jpg" +"7811" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7811.jpg" +"7812" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7812.jpg" +"7813" "Are there three pears in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7813.jpg" +"7814" "Are there four pears in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7814.jpg" +"7815" "Is the leave yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7815.jpg" +"7816" "Is the leave white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7816.jpg" +"7817" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7817.jpg" +"7818" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7818.jpg" +"7819" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7819.jpg" +"7820" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7820.jpg" +"7821" "Is the road curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7821.jpg" +"7822" "Is the road straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7822.jpg" +"7823" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7823.jpg" +"7824" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7824.jpg" +"7825" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7825.jpg" +"7826" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7826.jpg" +"7827" "Are there four trees in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7827.jpg" +"7828" "Are there five trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7828.jpg" +"7829" "Is there one banana in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7829.jpg" +"7830" "Are there two bananas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7830.jpg" +"7831" "Is there one bread in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7831.jpg" +"7832" "Are there two breads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7832.jpg" +"7833" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7833.jpg" +"7834" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7834.jpg" +"7835" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7835.jpg" +"7836" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7836.jpg" +"7837" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7837.jpg" +"7838" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7838.jpg" +"7839" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7839.jpg" +"7840" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7840.jpg" +"7841" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7841.jpg" +"7842" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7842.jpg" +"7843" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7843.jpg" +"7844" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7844.jpg" +"7845" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7845.jpg" +"7846" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7846.jpg" +"7847" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7847.jpg" +"7848" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7848.jpg" +"7849" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7849.jpg" +"7850" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7850.jpg" +"7851" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7851.jpg" +"7852" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7852.jpg" +"7853" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7853.jpg" +"7854" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7854.jpg" +"7855" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7855.jpg" +"7856" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7856.jpg" +"7857" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7857.jpg" +"7858" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7858.jpg" +"7859" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7859.jpg" +"7860" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7860.jpg" +"7861" "Are there two dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7861.jpg" +"7862" "Are there six dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7862.jpg" +"7863" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7863.jpg" +"7864" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7864.jpg" +"7865" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7865.jpg" +"7866" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7866.jpg" +"7867" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7867.jpg" +"7868" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7868.jpg" +"7869" "Is there one deer in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7869.jpg" +"7870" "Are there two deer in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7870.jpg" +"7871" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7871.jpg" +"7872" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7872.jpg" +"7873" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7873.jpg" +"7874" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7874.jpg" +"7875" "Are there two balloons in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7875.jpg" +"7876" "Are there three balloons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7876.jpg" +"7877" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7877.jpg" +"7878" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7878.jpg" +"7879" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7879.jpg" +"7880" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7880.jpg" +"7881" "Is the building tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7881.jpg" +"7882" "Is the building short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7882.jpg" +"7883" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7883.jpg" +"7884" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7884.jpg" +"7885" "Does the person surf in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7885.jpg" +"7886" "Does the person swim in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7886.jpg" +"7887" "Is there one surfboard in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7887.jpg" +"7888" "Are there two surfboards in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7888.jpg" +"7889" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7889.jpg" +"7890" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7890.jpg" +"7891" "Is there one flower in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7891.jpg" +"7892" "Are there two flowers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7892.jpg" +"7893" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7893.jpg" +"7894" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7894.jpg" +"7895" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7895.jpg" +"7896" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7896.jpg" +"7897" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7897.jpg" +"7898" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7898.jpg" +"7899" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7899.jpg" +"7900" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7900.jpg" +"7901" "Is the forest yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7901.jpg" +"7902" "Is the forest white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7902.jpg" +"7903" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7903.jpg" +"7904" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7904.jpg" +"7905" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7905.jpg" +"7906" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7906.jpg" +"7907" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7907.jpg" +"7908" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7908.jpg" +"7909" "Is the sea blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7909.jpg" +"7910" "Is the sea black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7910.jpg" +"7911" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7911.jpg" +"7912" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7912.jpg" +"7913" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7913.jpg" +"7914" "Are there two pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7914.jpg" +"7915" "Is there one notebook in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7915.jpg" +"7916" "Are there two notebooks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7916.jpg" +"7917" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7917.jpg" +"7918" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7918.jpg" +"7919" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7919.jpg" +"7920" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7920.jpg" +"7921" "Is the train blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7921.jpg" +"7922" "Is the train white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7922.jpg" +"7923" "Is the forest dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7923.jpg" +"7924" "Is the forest sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7924.jpg" +"7925" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7925.jpg" +"7926" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7926.jpg" +"7927" "Is there one cat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7927.jpg" +"7928" "Are there two cats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7928.jpg" +"7929" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7929.jpg" +"7930" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7930.jpg" +"7931" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7931.jpg" +"7932" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7932.jpg" +"7933" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7933.jpg" +"7934" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7934.jpg" +"7935" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7935.jpg" +"7936" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7936.jpg" +"7937" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7937.jpg" +"7938" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7938.jpg" +"7939" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7939.jpg" +"7940" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7940.jpg" +"7941" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7941.jpg" +"7942" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7942.jpg" +"7943" "Is the desert dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7943.jpg" +"7944" "Is the desert wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7944.jpg" +"7945" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7945.jpg" +"7946" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7946.jpg" +"7947" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7947.jpg" +"7948" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7948.jpg" +"7949" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7949.jpg" +"7950" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7950.jpg" +"7951" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7951.jpg" +"7952" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7952.jpg" +"7953" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7953.jpg" +"7954" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7954.jpg" +"7955" "Is the sky white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7955.jpg" +"7956" "Is the sky black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7956.jpg" +"7957" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7957.jpg" +"7958" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7958.jpg" +"7959" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7959.jpg" +"7960" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7960.jpg" +"7961" "Are there two shoes in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7961.jpg" +"7962" "Are there three shoes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7962.jpg" +"7963" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7963.jpg" +"7964" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7964.jpg" +"7965" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7965.jpg" +"7966" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7966.jpg" +"7967" "Is there one camera in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7967.jpg" +"7968" "Are there two cameras in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7968.jpg" +"7969" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7969.jpg" +"7970" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7970.jpg" +"7971" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7971.jpg" +"7972" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7972.jpg" +"7973" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7973.jpg" +"7974" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7974.jpg" +"7975" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7975.jpg" +"7976" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7976.jpg" +"7977" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7977.jpg" +"7978" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7978.jpg" +"7979" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7979.jpg" +"7980" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7980.jpg" +"7981" "Is there one phone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7981.jpg" +"7982" "Are there two phones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7982.jpg" +"7983" "Is there one pad in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7983.jpg" +"7984" "Are there two pads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7984.jpg" +"7985" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7985.jpg" +"7986" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7986.jpg" +"7987" "Is there one fox in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7987.jpg" +"7988" "Are there two foxes in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7988.jpg" +"7989" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7989.jpg" +"7990" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7990.jpg" +"7991" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7991.jpg" +"7992" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7992.jpg" +"7993" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7993.jpg" +"7994" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7994.jpg" +"7995" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7995.jpg" +"7996" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7996.jpg" +"7997" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7997.jpg" +"7998" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7998.jpg" +"7999" "Is there one goose in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/7999.jpg" +"8000" "Are there two geese in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8000.jpg" +"8001" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8001.jpg" +"8002" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8002.jpg" +"8003" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8003.jpg" +"8004" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8004.jpg" +"8005" "Is there one lemon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8005.jpg" +"8006" "Are there two lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8006.jpg" +"8007" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8007.jpg" +"8008" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8008.jpg" +"8009" "Is the tree tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8009.jpg" +"8010" "Is the tree short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8010.jpg" +"8011" "Is there one woman in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8011.jpg" +"8012" "Are there two women in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8012.jpg" +"8013" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8013.jpg" +"8014" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8014.jpg" +"8015" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8015.jpg" +"8016" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8016.jpg" +"8017" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8017.jpg" +"8018" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8018.jpg" +"8019" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8019.jpg" +"8020" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8020.jpg" +"8021" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8021.jpg" +"8022" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8022.jpg" +"8023" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8023.jpg" +"8024" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8024.jpg" +"8025" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8025.jpg" +"8026" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8026.jpg" +"8027" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8027.jpg" +"8028" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8028.jpg" +"8029" "Are there two dogs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8029.jpg" +"8030" "Are there three dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8030.jpg" +"8031" "Is the table tidy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8031.jpg" +"8032" "Is the table messy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8032.jpg" +"8033" "Is there one pad in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8033.jpg" +"8034" "Are there two pads in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8034.jpg" +"8035" "Is there one phone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8035.jpg" +"8036" "Are there two phones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8036.jpg" +"8037" "Is there one watch in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8037.jpg" +"8038" "Are there two watches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8038.jpg" +"8039" "Is there one earphone in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8039.jpg" +"8040" "Are there two earphones in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8040.jpg" +"8041" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8041.jpg" +"8042" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8042.jpg" +"8043" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8043.jpg" +"8044" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8044.jpg" +"8045" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8045.jpg" +"8046" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8046.jpg" +"8047" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8047.jpg" +"8048" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8048.jpg" +"8049" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8049.jpg" +"8050" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8050.jpg" +"8051" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8051.jpg" +"8052" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8052.jpg" +"8053" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8053.jpg" +"8054" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8054.jpg" +"8055" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8055.jpg" +"8056" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8056.jpg" +"8057" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8057.jpg" +"8058" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8058.jpg" +"8059" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8059.jpg" +"8060" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8060.jpg" +"8061" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8061.jpg" +"8062" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8062.jpg" +"8063" "Is the sky red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8063.jpg" +"8064" "Is the sky white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8064.jpg" +"8065" "Is the signal green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8065.jpg" +"8066" "Is the signal yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8066.jpg" +"8067" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8067.jpg" +"8068" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8068.jpg" +"8069" "Is there one bird in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8069.jpg" +"8070" "Are there two birds in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8070.jpg" +"8071" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8071.jpg" +"8072" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8072.jpg" +"8073" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8073.jpg" +"8074" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8074.jpg" +"8075" "Is the tree yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8075.jpg" +"8076" "Is the tree green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8076.jpg" +"8077" "Is the grass withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8077.jpg" +"8078" "Is the grass lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8078.jpg" +"8079" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8079.jpg" +"8080" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8080.jpg" +"8081" "Is there one house in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8081.jpg" +"8082" "Are there two houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8082.jpg" +"8083" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8083.jpg" +"8084" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8084.jpg" +"8085" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8085.jpg" +"8086" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8086.jpg" +"8087" "Is the ground muddy in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8087.jpg" +"8088" "Is the ground dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8088.jpg" +"8089" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8089.jpg" +"8090" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8090.jpg" +"8091" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8091.jpg" +"8092" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8092.jpg" +"8093" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8093.jpg" +"8094" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8094.jpg" +"8095" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8095.jpg" +"8096" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8096.jpg" +"8097" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8097.jpg" +"8098" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8098.jpg" +"8099" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8099.jpg" +"8100" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8100.jpg" +"8101" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8101.jpg" +"8102" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8102.jpg" +"8103" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8103.jpg" +"8104" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8104.jpg" +"8105" "Is the flower blooming in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8105.jpg" +"8106" "Is the flower withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8106.jpg" +"8107" "Is there one mushroom in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8107.jpg" +"8108" "Are there two mushrooms in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8108.jpg" +"8109" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8109.jpg" +"8110" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8110.jpg" +"8111" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8111.jpg" +"8112" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8112.jpg" +"8113" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8113.jpg" +"8114" "Are there two pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8114.jpg" +"8115" "Is there one notebook in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8115.jpg" +"8116" "Are there two notebooks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8116.jpg" +"8117" "Is the book open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8117.jpg" +"8118" "Is the book closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8118.jpg" +"8119" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8119.jpg" +"8120" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8120.jpg" +"8121" "Is the bridge long in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8121.jpg" +"8122" "Is the bridge short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8122.jpg" +"8123" "Is the sea calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8123.jpg" +"8124" "Is the sea stormy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8124.jpg" +"8125" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8125.jpg" +"8126" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8126.jpg" +"8127" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8127.jpg" +"8128" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8128.jpg" +"8129" "Are there two chairs in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8129.jpg" +"8130" "Are there three chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8130.jpg" +"8131" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8131.jpg" +"8132" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8132.jpg" +"8133" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8133.jpg" +"8134" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8134.jpg" +"8135" "Is the plate white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8135.jpg" +"8136" "Is the plate black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8136.jpg" +"8137" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8137.jpg" +"8138" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8138.jpg" +"8139" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8139.jpg" +"8140" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8140.jpg" +"8141" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8141.jpg" +"8142" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8142.jpg" +"8143" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8143.jpg" +"8144" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8144.jpg" +"8145" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8145.jpg" +"8146" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8146.jpg" +"8147" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8147.jpg" +"8148" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8148.jpg" +"8149" "Are there five trees in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8149.jpg" +"8150" "Are there six trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8150.jpg" +"8151" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8151.jpg" +"8152" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8152.jpg" +"8153" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8153.jpg" +"8154" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8154.jpg" +"8155" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8155.jpg" +"8156" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8156.jpg" +"8157" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8157.jpg" +"8158" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8158.jpg" +"8159" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8159.jpg" +"8160" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8160.jpg" +"8161" "Is the house old in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8161.jpg" +"8162" "Is the house brand new in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8162.jpg" +"8163" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8163.jpg" +"8164" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8164.jpg" +"8165" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8165.jpg" +"8166" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8166.jpg" +"8167" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8167.jpg" +"8168" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8168.jpg" +"8169" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8169.jpg" +"8170" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8170.jpg" +"8171" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8171.jpg" +"8172" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8172.jpg" +"8173" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8173.jpg" +"8174" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8174.jpg" +"8175" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8175.jpg" +"8176" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8176.jpg" +"8177" "Is the dog lie down in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8177.jpg" +"8178" "Is the dog stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8178.jpg" +"8179" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8179.jpg" +"8180" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8180.jpg" +"8181" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8181.jpg" +"8182" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8182.jpg" +"8183" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8183.jpg" +"8184" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8184.jpg" +"8185" "Is the sunflower dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8185.jpg" +"8186" "Is the sunflower sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8186.jpg" +"8187" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8187.jpg" +"8188" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8188.jpg" +"8189" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8189.jpg" +"8190" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8190.jpg" +"8191" "Is the sofa yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8191.jpg" +"8192" "Is the sofa white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8192.jpg" +"8193" "Is the laptop open in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8193.jpg" +"8194" "Is the laptop closed in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8194.jpg" +"8195" "Is there one notebook in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8195.jpg" +"8196" "Are there two notebooks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8196.jpg" +"8197" "Is there one pen in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8197.jpg" +"8198" "Are there two pens in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8198.jpg" +"8199" "Is there one watch in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8199.jpg" +"8200" "Are there two watches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8200.jpg" +"8201" "Is the pad closed in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8201.jpg" +"8202" "Is the pad open in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8202.jpg" +"8203" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8203.jpg" +"8204" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8204.jpg" +"8205" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8205.jpg" +"8206" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8206.jpg" +"8207" "Is the bridge curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8207.jpg" +"8208" "Is the bridge straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8208.jpg" +"8209" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8209.jpg" +"8210" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8210.jpg" +"8211" "Is the lake murky in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8211.jpg" +"8212" "Is the lake clear in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8212.jpg" +"8213" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8213.jpg" +"8214" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8214.jpg" +"8215" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8215.jpg" +"8216" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8216.jpg" +"8217" "Is the sea blue in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8217.jpg" +"8218" "Is the sea black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8218.jpg" +"8219" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8219.jpg" +"8220" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8220.jpg" +"8221" "Is the forest withered in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8221.jpg" +"8222" "Is the forest lively in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8222.jpg" +"8223" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8223.jpg" +"8224" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8224.jpg" +"8225" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8225.jpg" +"8226" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8226.jpg" +"8227" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8227.jpg" +"8228" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8228.jpg" +"8229" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8229.jpg" +"8230" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8230.jpg" +"8231" "Is the island small in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8231.jpg" +"8232" "Is the island large in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8232.jpg" +"8233" "Is the sea wide in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8233.jpg" +"8234" "Is the sea small in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8234.jpg" +"8235" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8235.jpg" +"8236" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8236.jpg" +"8237" "Is the sun dazzling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8237.jpg" +"8238" "Is the sun dim in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8238.jpg" +"8239" "Is the sea sparkling in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8239.jpg" +"8240" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8240.jpg" +"8241" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8241.jpg" +"8242" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8242.jpg" +"8243" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8243.jpg" +"8244" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8244.jpg" +"8245" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8245.jpg" +"8246" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8246.jpg" +"8247" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8247.jpg" +"8248" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8248.jpg" +"8249" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8249.jpg" +"8250" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8250.jpg" +"8251" "Is there one ship in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8251.jpg" +"8252" "Are there two ships in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8252.jpg" +"8253" "Is there one man in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8253.jpg" +"8254" "Are there two men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8254.jpg" +"8255" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8255.jpg" +"8256" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8256.jpg" +"8257" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8257.jpg" +"8258" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8258.jpg" +"8259" "Is there one tree in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8259.jpg" +"8260" "Are there two trees in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8260.jpg" +"8261" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8261.jpg" +"8262" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8262.jpg" +"8263" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8263.jpg" +"8264" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8264.jpg" +"8265" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8265.jpg" +"8266" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8266.jpg" +"8267" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8267.jpg" +"8268" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8268.jpg" +"8269" "Does the woman stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8269.jpg" +"8270" "Does the woman sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8270.jpg" +"8271" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8271.jpg" +"8272" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8272.jpg" +"8273" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8273.jpg" +"8274" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8274.jpg" +"8275" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8275.jpg" +"8276" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8276.jpg" +"8277" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8277.jpg" +"8278" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8278.jpg" +"8279" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8279.jpg" +"8280" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8280.jpg" +"8281" "Is the tree thick in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8281.jpg" +"8282" "Is the tree thin in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8282.jpg" +"8283" "Is there one lion in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8283.jpg" +"8284" "Are there two lions in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8284.jpg" +"8285" "Is the beach flat in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8285.jpg" +"8286" "Is the beach uneven in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8286.jpg" +"8287" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8287.jpg" +"8288" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8288.jpg" +"8289" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8289.jpg" +"8290" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8290.jpg" +"8291" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8291.jpg" +"8292" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8292.jpg" +"8293" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8293.jpg" +"8294" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8294.jpg" +"8295" "Is the beach wet in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8295.jpg" +"8296" "Is the beach dry in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8296.jpg" +"8297" "Is there one tortoise in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8297.jpg" +"8298" "Are there two tortoises in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8298.jpg" +"8299" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8299.jpg" +"8300" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8300.jpg" +"8301" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8301.jpg" +"8302" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8302.jpg" +"8303" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8303.jpg" +"8304" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8304.jpg" +"8305" "Is the road uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8305.jpg" +"8306" "Is the road flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8306.jpg" +"8307" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8307.jpg" +"8308" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8308.jpg" +"8309" "Is the sea rolling waves in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8309.jpg" +"8310" "Is the sea calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8310.jpg" +"8311" "Are there two men in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8311.jpg" +"8312" "Are there three men in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8312.jpg" +"8313" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8313.jpg" +"8314" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8314.jpg" +"8315" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8315.jpg" +"8316" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8316.jpg" +"8317" "Is the island small in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8317.jpg" +"8318" "Is the island large in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8318.jpg" +"8319" "Is the woman sit in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8319.jpg" +"8320" "Is the woman stand in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8320.jpg" +"8321" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8321.jpg" +"8322" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8322.jpg" +"8323" "Is there one watch in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8323.jpg" +"8324" "Are there two watches in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8324.jpg" +"8325" "Does the person sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8325.jpg" +"8326" "Does the person stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8326.jpg" +"8327" "Is there one chair in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8327.jpg" +"8328" "Are there two chairs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8328.jpg" +"8329" "Is there one dog in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8329.jpg" +"8330" "Are there two dogs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8330.jpg" +"8331" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8331.jpg" +"8332" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8332.jpg" +"8333" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8333.jpg" +"8334" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8334.jpg" +"8335" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8335.jpg" +"8336" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8336.jpg" +"8337" "Does the dog sit in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8337.jpg" +"8338" "Does the dog lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8338.jpg" +"8339" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8339.jpg" +"8340" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8340.jpg" +"8341" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8341.jpg" +"8342" "Does the dog stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8342.jpg" +"8343" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8343.jpg" +"8344" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8344.jpg" +"8345" "Does the dog lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8345.jpg" +"8346" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8346.jpg" +"8347" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8347.jpg" +"8348" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8348.jpg" +"8349" "Does the dog swim in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8349.jpg" +"8350" "Does the dog run in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8350.jpg" +"8351" "Is the lake murky in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8351.jpg" +"8352" "Is the lake clear in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8352.jpg" +"8353" "Is there one duck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8353.jpg" +"8354" "Are there two ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8354.jpg" +"8355" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8355.jpg" +"8356" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8356.jpg" +"8357" "Are there two ducks in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8357.jpg" +"8358" "Are there three ducks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8358.jpg" +"8359" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8359.jpg" +"8360" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8360.jpg" +"8361" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8361.jpg" +"8362" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8362.jpg" +"8363" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8363.jpg" +"8364" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8364.jpg" +"8365" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8365.jpg" +"8366" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8366.jpg" +"8367" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8367.jpg" +"8368" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8368.jpg" +"8369" "Is there one goose in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8369.jpg" +"8370" "Are there two geese in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8370.jpg" +"8371" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8371.jpg" +"8372" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8372.jpg" +"8373" "Is the lake calm in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8373.jpg" +"8374" "Is the lake rolling in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8374.jpg" +"8375" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8375.jpg" +"8376" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8376.jpg" +"8377" "Are there three fish in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8377.jpg" +"8378" "Are there four fish in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8378.jpg" +"8379" "Is the flower vibrant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8379.jpg" +"8380" "Is the flower plain in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8380.jpg" +"8381" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8381.jpg" +"8382" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8382.jpg" +"8383" "Is the flower vibrant in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8383.jpg" +"8384" "Is the flower plain in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8384.jpg" +"8385" "Is the tablecloth clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8385.jpg" +"8386" "Is the tablecloth dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8386.jpg" +"8387" "Is there one vase in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8387.jpg" +"8388" "Are there two vases in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8388.jpg" +"8389" "Is the glass white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8389.jpg" +"8390" "Is the glass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8390.jpg" +"8391" "Is the grapefruit separated in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8391.jpg" +"8392" "Is the grapefruit complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8392.jpg" +"8393" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8393.jpg" +"8394" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8394.jpg" +"8395" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8395.jpg" +"8396" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8396.jpg" +"8397" "Is there one house in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8397.jpg" +"8398" "Are there two houses in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8398.jpg" +"8399" "Is there one lemon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8399.jpg" +"8400" "Are there two lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8400.jpg" +"8401" "Is there one lemon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8401.jpg" +"8402" "Are there two lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8402.jpg" +"8403" "Is there one orange in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8403.jpg" +"8404" "Are there two oranges in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8404.jpg" +"8405" "Is there one grapefruit in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8405.jpg" +"8406" "Are there two grapefruits in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8406.jpg" +"8407" "Are there two lemons in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8407.jpg" +"8408" "Are there three lemons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8408.jpg" +"8409" "Is the shrimp raw in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8409.jpg" +"8410" "Is the shrimp ripe in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8410.jpg" +"8411" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8411.jpg" +"8412" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8412.jpg" +"8413" "Is the lemon yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8413.jpg" +"8414" "Is the lemon green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8414.jpg" +"8415" "Is there one lion in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8415.jpg" +"8416" "Are there two lions in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8416.jpg" +"8417" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8417.jpg" +"8418" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8418.jpg" +"8419" "Are there three cars in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8419.jpg" +"8420" "Are there four cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8420.jpg" +"8421" "Does the tiger stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8421.jpg" +"8422" "Does the tiger sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8422.jpg" +"8423" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8423.jpg" +"8424" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8424.jpg" +"8425" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8425.jpg" +"8426" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8426.jpg" +"8427" "Are there two lions in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8427.jpg" +"8428" "Are there three lions in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8428.jpg" +"8429" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8429.jpg" +"8430" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8430.jpg" +"8431" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8431.jpg" +"8432" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8432.jpg" +"8433" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8433.jpg" +"8434" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8434.jpg" +"8435" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8435.jpg" +"8436" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8436.jpg" +"8437" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8437.jpg" +"8438" "Is the cloud yellow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8438.jpg" +"8439" "Does the lion open your mouth in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8439.jpg" +"8440" "Does the lion close your mouth in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8440.jpg" +"8441" "Are there six tangerines in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8441.jpg" +"8442" "Are there seven tangerines in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8442.jpg" +"8443" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8443.jpg" +"8444" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8444.jpg" +"8445" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8445.jpg" +"8446" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8446.jpg" +"8447" "Is the tangerine yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8447.jpg" +"8448" "Is the tangerine white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8448.jpg" +"8449" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8449.jpg" +"8450" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8450.jpg" +"8451" "Are there two drawings in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8451.jpg" +"8452" "Are there three drawings in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8452.jpg" +"8453" "Is there one pig in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8453.jpg" +"8454" "Are there two pigs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8454.jpg" +"8455" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8455.jpg" +"8456" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8456.jpg" +"8457" "Is the fence white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8457.jpg" +"8458" "Is the fence red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8458.jpg" +"8459" "Is there one skate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8459.jpg" +"8460" "Are there two skates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8460.jpg" +"8461" "Is the floor yellow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8461.jpg" +"8462" "Is the floor black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8462.jpg" +"8463" "Is the watermelon sliced in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8463.jpg" +"8464" "Is the watermelon complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8464.jpg" +"8465" "Are there four strawberries in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8465.jpg" +"8466" "Are there five strawberries in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8466.jpg" +"8467" "Is there one pineapple in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8467.jpg" +"8468" "Are there two pineapples in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8468.jpg" +"8469" "Is the table clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8469.jpg" +"8470" "Is the table dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8470.jpg" +"8471" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8471.jpg" +"8472" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8472.jpg" +"8473" "Is there one rabbit in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8473.jpg" +"8474" "Are there two rabbits in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8474.jpg" +"8475" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8475.jpg" +"8476" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8476.jpg" +"8477" "Is there one rabbit in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8477.jpg" +"8478" "Are there two rabbits in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8478.jpg" +"8479" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8479.jpg" +"8480" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8480.jpg" +"8481" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8481.jpg" +"8482" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8482.jpg" +"8483" "Is the refrigerator white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8483.jpg" +"8484" "Is the refrigerator black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8484.jpg" +"8485" "Are there two colas in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8485.jpg" +"8486" "Are there three colas in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8486.jpg" +"8487" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8487.jpg" +"8488" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8488.jpg" +"8489" "Is the forest lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8489.jpg" +"8490" "Is the forest withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8490.jpg" +"8491" "Is the lake rippling water in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8491.jpg" +"8492" "Is the lake calm waters in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8492.jpg" +"8493" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8493.jpg" +"8494" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8494.jpg" +"8495" "Is the river turbulent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8495.jpg" +"8496" "Is the river slow in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8496.jpg" +"8497" "Is the sand uneven in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8497.jpg" +"8498" "Is the sand flat in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8498.jpg" +"8499" "Is the road narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8499.jpg" +"8500" "Is the road wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8500.jpg" +"8501" "Is the forest golden in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8501.jpg" +"8502" "Is the forest white in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8502.jpg" +"8503" "Is the ground narrow in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8503.jpg" +"8504" "Is the ground wide in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8504.jpg" +"8505" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8505.jpg" +"8506" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8506.jpg" +"8507" "Is the road clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8507.jpg" +"8508" "Is the road dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8508.jpg" +"8509" "Is the mountain tall in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8509.jpg" +"8510" "Is the mountain short in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8510.jpg" +"8511" "Is the ground curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8511.jpg" +"8512" "Is the ground straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8512.jpg" +"8513" "Is the snow white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8513.jpg" +"8514" "Is the snow black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8514.jpg" +"8515" "Is the ground curved in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8515.jpg" +"8516" "Is the ground straight in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8516.jpg" +"8517" "Is the ground dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8517.jpg" +"8518" "Is the ground wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8518.jpg" +"8519" "Is the sign prominent in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8519.jpg" +"8520" "Is the sign hidden in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8520.jpg" +"8521" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8521.jpg" +"8522" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8522.jpg" +"8523" "Is the cream pink in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8523.jpg" +"8524" "Is the cream green in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8524.jpg" +"8525" "Is the strawberry red in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8525.jpg" +"8526" "Is the strawberry black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8526.jpg" +"8527" "Is the cream white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8527.jpg" +"8528" "Is the cream blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8528.jpg" +"8529" "Is there one plate in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8529.jpg" +"8530" "Are there two plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8530.jpg" +"8531" "Are there six strawberries in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8531.jpg" +"8532" "Are there seven strawberries in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8532.jpg" +"8533" "Is the cake round in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8533.jpg" +"8534" "Is the cake square in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8534.jpg" +"8535" "Is the candle extinguished in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8535.jpg" +"8536" "Is the candle burning in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8536.jpg" +"8537" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8537.jpg" +"8538" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8538.jpg" +"8539" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8539.jpg" +"8540" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8540.jpg" +"8541" "Is there one car in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8541.jpg" +"8542" "Are there two cars in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8542.jpg" +"8543" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8543.jpg" +"8544" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8544.jpg" +"8545" "Is the ground clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8545.jpg" +"8546" "Is the ground dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8546.jpg" +"8547" "Is there one table in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8547.jpg" +"8548" "Are there two tables in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8548.jpg" +"8549" "Is the floor clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8549.jpg" +"8550" "Is the floor dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8550.jpg" +"8551" "Is the wall white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8551.jpg" +"8552" "Is the wall black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8552.jpg" +"8553" "Is there one tiger in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8553.jpg" +"8554" "Are there two tigers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8554.jpg" +"8555" "Is the grass lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8555.jpg" +"8556" "Is the grass withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8556.jpg" +"8557" "Does the tiger lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8557.jpg" +"8558" "Does the tiger stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8558.jpg" +"8559" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8559.jpg" +"8560" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8560.jpg" +"8561" "Does the tiger stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8561.jpg" +"8562" "Does the tiger lie prone in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8562.jpg" +"8563" "Is the grass dense in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8563.jpg" +"8564" "Is the grass sparse in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8564.jpg" +"8565" "Does the tiger lie prone in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8565.jpg" +"8566" "Does the tiger stand in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8566.jpg" +"8567" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8567.jpg" +"8568" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8568.jpg" +"8569" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8569.jpg" +"8570" "Is the grass blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8570.jpg" +"8571" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8571.jpg" +"8572" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8572.jpg" +"8573" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8573.jpg" +"8574" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8574.jpg" +"8575" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8575.jpg" +"8576" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8576.jpg" +"8577" "Is the tree lively in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8577.jpg" +"8578" "Is the tree withered in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8578.jpg" +"8579" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8579.jpg" +"8580" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8580.jpg" +"8581" "Is the mountain short in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8581.jpg" +"8582" "Is the mountain tall in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8582.jpg" +"8583" "Is the forest green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8583.jpg" +"8584" "Is the forest blue in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8584.jpg" +"8585" "Is there one truck in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8585.jpg" +"8586" "Are there two trucks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8586.jpg" +"8587" "Is the grass green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8587.jpg" +"8588" "Is the grass black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8588.jpg" +"8589" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8589.jpg" +"8590" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8590.jpg" +"8591" "Is there one volleyball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8591.jpg" +"8592" "Are there two volleyballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8592.jpg" +"8593" "Is the beach dry in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8593.jpg" +"8594" "Is the beach wet in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8594.jpg" +"8595" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8595.jpg" +"8596" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8596.jpg" +"8597" "Are there two people in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8597.jpg" +"8598" "Are there three people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8598.jpg" +"8599" "Is there one volleyball in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8599.jpg" +"8600" "Are there two volleyballs in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8600.jpg" +"8601" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8601.jpg" +"8602" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8602.jpg" +"8603" "Are there four flowers in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8603.jpg" +"8604" "Are there five flowers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8604.jpg" +"8605" "Is the watermelon separated in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8605.jpg" +"8606" "Is the watermelon complete in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8606.jpg" +"8607" "Is there one fork in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8607.jpg" +"8608" "Are there two forks in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8608.jpg" +"8609" "Is there one scoon in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8609.jpg" +"8610" "Are there two scoons in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8610.jpg" +"8611" "Is there one ginger in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8611.jpg" +"8612" "Are there two gingers in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8612.jpg" +"8613" "Is the leave green in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8613.jpg" +"8614" "Is the leave red in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8614.jpg" +"8615" "Are there two plates in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8615.jpg" +"8616" "Are there three plates in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8616.jpg" +"8617" "Is the sky sunny in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8617.jpg" +"8618" "Is the sky gloomy in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8618.jpg" +"8619" "Is the cloud white in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8619.jpg" +"8620" "Is the cloud black in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8620.jpg" +"8621" "Is there one person in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8621.jpg" +"8622" "Are there two people in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8622.jpg" +"8623" "Is the wall clean in this image?" "yes" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8623.jpg" +"8624" "Is the wall dirty in this image?" "no" "discriminative-attribute-state" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8624.jpg" +"8625" "Does the man stand in this image?" "yes" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8625.jpg" +"8626" "Does the man sit in this image?" "no" "discriminative-attribute-action" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8626.jpg" +"8627" "Are there two urinals in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8627.jpg" +"8628" "Are there three urinals in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8628.jpg" +"8629" "Is there one hat in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8629.jpg" +"8630" "Are there two hats in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8630.jpg" +"8631" "Is there one cup in this image?" "yes" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8631.jpg" +"8632" "Are there two cups in this image?" "no" "discriminative-attribute-number" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8632.jpg" +"8633" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8633.jpg" +"8634" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8634.jpg" +"8635" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8635.jpg" +"8636" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8636.jpg" +"8637" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8637.jpg" +"8638" "Is there a plane in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8638.jpg" +"8639" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8639.jpg" +"8640" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8640.jpg" +"8641" "Is there a paddle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8641.jpg" +"8642" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8642.jpg" +"8643" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8643.jpg" +"8644" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8644.jpg" +"8645" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8645.jpg" +"8646" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8646.jpg" +"8647" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8647.jpg" +"8648" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8648.jpg" +"8649" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8649.jpg" +"8650" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8650.jpg" +"8651" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8651.jpg" +"8652" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8652.jpg" +"8653" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8653.jpg" +"8654" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8654.jpg" +"8655" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8655.jpg" +"8656" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8656.jpg" +"8657" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8657.jpg" +"8658" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8658.jpg" +"8659" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8659.jpg" +"8660" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8660.jpg" +"8661" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8661.jpg" +"8662" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8662.jpg" +"8663" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8663.jpg" +"8664" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8664.jpg" +"8665" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8665.jpg" +"8666" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8666.jpg" +"8667" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8667.jpg" +"8668" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8668.jpg" +"8669" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8669.jpg" +"8670" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8670.jpg" +"8671" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8671.jpg" +"8672" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8672.jpg" +"8673" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8673.jpg" +"8674" "Is there a goal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8674.jpg" +"8675" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8675.jpg" +"8676" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8676.jpg" +"8677" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8677.jpg" +"8678" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8678.jpg" +"8679" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8679.jpg" +"8680" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8680.jpg" +"8681" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8681.jpg" +"8682" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8682.jpg" +"8683" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8683.jpg" +"8684" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8684.jpg" +"8685" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8685.jpg" +"8686" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8686.jpg" +"8687" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8687.jpg" +"8688" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8688.jpg" +"8689" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8689.jpg" +"8690" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8690.jpg" +"8691" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8691.jpg" +"8692" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8692.jpg" +"8693" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8693.jpg" +"8694" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8694.jpg" +"8695" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8695.jpg" +"8696" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8696.jpg" +"8697" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8697.jpg" +"8698" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8698.jpg" +"8699" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8699.jpg" +"8700" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8700.jpg" +"8701" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8701.jpg" +"8702" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8702.jpg" +"8703" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8703.jpg" +"8704" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8704.jpg" +"8705" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8705.jpg" +"8706" "Is there a camel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8706.jpg" +"8707" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8707.jpg" +"8708" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8708.jpg" +"8709" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8709.jpg" +"8710" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8710.jpg" +"8711" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8711.jpg" +"8712" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8712.jpg" +"8713" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8713.jpg" +"8714" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8714.jpg" +"8715" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8715.jpg" +"8716" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8716.jpg" +"8717" "Is there a camera in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8717.jpg" +"8718" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8718.jpg" +"8719" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8719.jpg" +"8720" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8720.jpg" +"8721" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8721.jpg" +"8722" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8722.jpg" +"8723" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8723.jpg" +"8724" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8724.jpg" +"8725" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8725.jpg" +"8726" "Is there a squirrel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8726.jpg" +"8727" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8727.jpg" +"8728" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8728.jpg" +"8729" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8729.jpg" +"8730" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8730.jpg" +"8731" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8731.jpg" +"8732" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8732.jpg" +"8733" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8733.jpg" +"8734" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8734.jpg" +"8735" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8735.jpg" +"8736" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8736.jpg" +"8737" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8737.jpg" +"8738" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8738.jpg" +"8739" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8739.jpg" +"8740" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8740.jpg" +"8741" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8741.jpg" +"8742" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8742.jpg" +"8743" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8743.jpg" +"8744" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8744.jpg" +"8745" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8745.jpg" +"8746" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8746.jpg" +"8747" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8747.jpg" +"8748" "Is there a dustbin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8748.jpg" +"8749" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8749.jpg" +"8750" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8750.jpg" +"8751" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8751.jpg" +"8752" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8752.jpg" +"8753" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8753.jpg" +"8754" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8754.jpg" +"8755" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8755.jpg" +"8756" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8756.jpg" +"8757" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8757.jpg" +"8758" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8758.jpg" +"8759" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8759.jpg" +"8760" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8760.jpg" +"8761" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8761.jpg" +"8762" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8762.jpg" +"8763" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8763.jpg" +"8764" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8764.jpg" +"8765" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8765.jpg" +"8766" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8766.jpg" +"8767" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8767.jpg" +"8768" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8768.jpg" +"8769" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8769.jpg" +"8770" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8770.jpg" +"8771" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8771.jpg" +"8772" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8772.jpg" +"8773" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8773.jpg" +"8774" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8774.jpg" +"8775" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8775.jpg" +"8776" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8776.jpg" +"8777" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8777.jpg" +"8778" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8778.jpg" +"8779" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8779.jpg" +"8780" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8780.jpg" +"8781" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8781.jpg" +"8782" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8782.jpg" +"8783" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8783.jpg" +"8784" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8784.jpg" +"8785" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8785.jpg" +"8786" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8786.jpg" +"8787" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8787.jpg" +"8788" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8788.jpg" +"8789" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8789.jpg" +"8790" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8790.jpg" +"8791" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8791.jpg" +"8792" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8792.jpg" +"8793" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8793.jpg" +"8794" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8794.jpg" +"8795" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8795.jpg" +"8796" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8796.jpg" +"8797" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8797.jpg" +"8798" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8798.jpg" +"8799" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8799.jpg" +"8800" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8800.jpg" +"8801" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8801.jpg" +"8802" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8802.jpg" +"8803" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8803.jpg" +"8804" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8804.jpg" +"8805" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8805.jpg" +"8806" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8806.jpg" +"8807" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8807.jpg" +"8808" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8808.jpg" +"8809" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8809.jpg" +"8810" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8810.jpg" +"8811" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8811.jpg" +"8812" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8812.jpg" +"8813" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8813.jpg" +"8814" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8814.jpg" +"8815" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8815.jpg" +"8816" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8816.jpg" +"8817" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8817.jpg" +"8818" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8818.jpg" +"8819" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8819.jpg" +"8820" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8820.jpg" +"8821" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8821.jpg" +"8822" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8822.jpg" +"8823" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8823.jpg" +"8824" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8824.jpg" +"8825" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8825.jpg" +"8826" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8826.jpg" +"8827" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8827.jpg" +"8828" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8828.jpg" +"8829" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8829.jpg" +"8830" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8830.jpg" +"8831" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8831.jpg" +"8832" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8832.jpg" +"8833" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8833.jpg" +"8834" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8834.jpg" +"8835" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8835.jpg" +"8836" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8836.jpg" +"8837" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8837.jpg" +"8838" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8838.jpg" +"8839" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8839.jpg" +"8840" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8840.jpg" +"8841" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8841.jpg" +"8842" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8842.jpg" +"8843" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8843.jpg" +"8844" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8844.jpg" +"8845" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8845.jpg" +"8846" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8846.jpg" +"8847" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8847.jpg" +"8848" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8848.jpg" +"8849" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8849.jpg" +"8850" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8850.jpg" +"8851" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8851.jpg" +"8852" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8852.jpg" +"8853" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8853.jpg" +"8854" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8854.jpg" +"8855" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8855.jpg" +"8856" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8856.jpg" +"8857" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8857.jpg" +"8858" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8858.jpg" +"8859" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8859.jpg" +"8860" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8860.jpg" +"8861" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8861.jpg" +"8862" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8862.jpg" +"8863" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8863.jpg" +"8864" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8864.jpg" +"8865" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8865.jpg" +"8866" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8866.jpg" +"8867" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8867.jpg" +"8868" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8868.jpg" +"8869" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8869.jpg" +"8870" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8870.jpg" +"8871" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8871.jpg" +"8872" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8872.jpg" +"8873" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8873.jpg" +"8874" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8874.jpg" +"8875" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8875.jpg" +"8876" "Is there a bus in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8876.jpg" +"8877" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8877.jpg" +"8878" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8878.jpg" +"8879" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8879.jpg" +"8880" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8880.jpg" +"8881" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8881.jpg" +"8882" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8882.jpg" +"8883" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8883.jpg" +"8884" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8884.jpg" +"8885" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8885.jpg" +"8886" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8886.jpg" +"8887" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8887.jpg" +"8888" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8888.jpg" +"8889" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8889.jpg" +"8890" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8890.jpg" +"8891" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8891.jpg" +"8892" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8892.jpg" +"8893" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8893.jpg" +"8894" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8894.jpg" +"8895" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8895.jpg" +"8896" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8896.jpg" +"8897" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8897.jpg" +"8898" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8898.jpg" +"8899" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8899.jpg" +"8900" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8900.jpg" +"8901" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8901.jpg" +"8902" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8902.jpg" +"8903" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8903.jpg" +"8904" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8904.jpg" +"8905" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8905.jpg" +"8906" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8906.jpg" +"8907" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8907.jpg" +"8908" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8908.jpg" +"8909" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8909.jpg" +"8910" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8910.jpg" +"8911" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8911.jpg" +"8912" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8912.jpg" +"8913" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8913.jpg" +"8914" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8914.jpg" +"8915" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8915.jpg" +"8916" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8916.jpg" +"8917" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8917.jpg" +"8918" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8918.jpg" +"8919" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8919.jpg" +"8920" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8920.jpg" +"8921" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8921.jpg" +"8922" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8922.jpg" +"8923" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8923.jpg" +"8924" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8924.jpg" +"8925" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8925.jpg" +"8926" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8926.jpg" +"8927" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8927.jpg" +"8928" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8928.jpg" +"8929" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8929.jpg" +"8930" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8930.jpg" +"8931" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8931.jpg" +"8932" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8932.jpg" +"8933" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8933.jpg" +"8934" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8934.jpg" +"8935" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8935.jpg" +"8936" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8936.jpg" +"8937" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8937.jpg" +"8938" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8938.jpg" +"8939" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8939.jpg" +"8940" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8940.jpg" +"8941" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8941.jpg" +"8942" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8942.jpg" +"8943" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8943.jpg" +"8944" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8944.jpg" +"8945" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8945.jpg" +"8946" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8946.jpg" +"8947" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8947.jpg" +"8948" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8948.jpg" +"8949" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8949.jpg" +"8950" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8950.jpg" +"8951" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8951.jpg" +"8952" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8952.jpg" +"8953" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8953.jpg" +"8954" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8954.jpg" +"8955" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8955.jpg" +"8956" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8956.jpg" +"8957" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8957.jpg" +"8958" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8958.jpg" +"8959" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8959.jpg" +"8960" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8960.jpg" +"8961" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8961.jpg" +"8962" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8962.jpg" +"8963" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8963.jpg" +"8964" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8964.jpg" +"8965" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8965.jpg" +"8966" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8966.jpg" +"8967" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8967.jpg" +"8968" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8968.jpg" +"8969" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8969.jpg" +"8970" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8970.jpg" +"8971" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8971.jpg" +"8972" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8972.jpg" +"8973" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8973.jpg" +"8974" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8974.jpg" +"8975" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8975.jpg" +"8976" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8976.jpg" +"8977" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8977.jpg" +"8978" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8978.jpg" +"8979" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8979.jpg" +"8980" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8980.jpg" +"8981" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8981.jpg" +"8982" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8982.jpg" +"8983" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8983.jpg" +"8984" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8984.jpg" +"8985" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8985.jpg" +"8986" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8986.jpg" +"8987" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8987.jpg" +"8988" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8988.jpg" +"8989" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8989.jpg" +"8990" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8990.jpg" +"8991" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8991.jpg" +"8992" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8992.jpg" +"8993" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8993.jpg" +"8994" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8994.jpg" +"8995" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8995.jpg" +"8996" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8996.jpg" +"8997" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8997.jpg" +"8998" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8998.jpg" +"8999" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/8999.jpg" +"9000" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9000.jpg" +"9001" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9001.jpg" +"9002" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9002.jpg" +"9003" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9003.jpg" +"9004" "Is there a bridge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9004.jpg" +"9005" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9005.jpg" +"9006" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9006.jpg" +"9007" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9007.jpg" +"9008" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9008.jpg" +"9009" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9009.jpg" +"9010" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9010.jpg" +"9011" "Is there a glass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9011.jpg" +"9012" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9012.jpg" +"9013" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9013.jpg" +"9014" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9014.jpg" +"9015" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9015.jpg" +"9016" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9016.jpg" +"9017" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9017.jpg" +"9018" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9018.jpg" +"9019" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9019.jpg" +"9020" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9020.jpg" +"9021" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9021.jpg" +"9022" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9022.jpg" +"9023" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9023.jpg" +"9024" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9024.jpg" +"9025" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9025.jpg" +"9026" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9026.jpg" +"9027" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9027.jpg" +"9028" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9028.jpg" +"9029" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9029.jpg" +"9030" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9030.jpg" +"9031" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9031.jpg" +"9032" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9032.jpg" +"9033" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9033.jpg" +"9034" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9034.jpg" +"9035" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9035.jpg" +"9036" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9036.jpg" +"9037" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9037.jpg" +"9038" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9038.jpg" +"9039" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9039.jpg" +"9040" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9040.jpg" +"9041" "Is there a toilet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9041.jpg" +"9042" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9042.jpg" +"9043" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9043.jpg" +"9044" "Is there a shampoo in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9044.jpg" +"9045" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9045.jpg" +"9046" "Is there a toilet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9046.jpg" +"9047" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9047.jpg" +"9048" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9048.jpg" +"9049" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9049.jpg" +"9050" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9050.jpg" +"9051" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9051.jpg" +"9052" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9052.jpg" +"9053" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9053.jpg" +"9054" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9054.jpg" +"9055" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9055.jpg" +"9056" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9056.jpg" +"9057" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9057.jpg" +"9058" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9058.jpg" +"9059" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9059.jpg" +"9060" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9060.jpg" +"9061" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9061.jpg" +"9062" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9062.jpg" +"9063" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9063.jpg" +"9064" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9064.jpg" +"9065" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9065.jpg" +"9066" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9066.jpg" +"9067" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9067.jpg" +"9068" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9068.jpg" +"9069" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9069.jpg" +"9070" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9070.jpg" +"9071" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9071.jpg" +"9072" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9072.jpg" +"9073" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9073.jpg" +"9074" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9074.jpg" +"9075" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9075.jpg" +"9076" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9076.jpg" +"9077" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9077.jpg" +"9078" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9078.jpg" +"9079" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9079.jpg" +"9080" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9080.jpg" +"9081" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9081.jpg" +"9082" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9082.jpg" +"9083" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9083.jpg" +"9084" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9084.jpg" +"9085" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9085.jpg" +"9086" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9086.jpg" +"9087" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9087.jpg" +"9088" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9088.jpg" +"9089" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9089.jpg" +"9090" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9090.jpg" +"9091" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9091.jpg" +"9092" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9092.jpg" +"9093" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9093.jpg" +"9094" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9094.jpg" +"9095" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9095.jpg" +"9096" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9096.jpg" +"9097" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9097.jpg" +"9098" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9098.jpg" +"9099" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9099.jpg" +"9100" "Is there a camera in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9100.jpg" +"9101" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9101.jpg" +"9102" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9102.jpg" +"9103" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9103.jpg" +"9104" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9104.jpg" +"9105" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9105.jpg" +"9106" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9106.jpg" +"9107" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9107.jpg" +"9108" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9108.jpg" +"9109" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9109.jpg" +"9110" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9110.jpg" +"9111" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9111.jpg" +"9112" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9112.jpg" +"9113" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9113.jpg" +"9114" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9114.jpg" +"9115" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9115.jpg" +"9116" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9116.jpg" +"9117" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9117.jpg" +"9118" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9118.jpg" +"9119" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9119.jpg" +"9120" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9120.jpg" +"9121" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9121.jpg" +"9122" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9122.jpg" +"9123" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9123.jpg" +"9124" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9124.jpg" +"9125" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9125.jpg" +"9126" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9126.jpg" +"9127" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9127.jpg" +"9128" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9128.jpg" +"9129" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9129.jpg" +"9130" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9130.jpg" +"9131" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9131.jpg" +"9132" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9132.jpg" +"9133" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9133.jpg" +"9134" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9134.jpg" +"9135" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9135.jpg" +"9136" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9136.jpg" +"9137" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9137.jpg" +"9138" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9138.jpg" +"9139" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9139.jpg" +"9140" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9140.jpg" +"9141" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9141.jpg" +"9142" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9142.jpg" +"9143" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9143.jpg" +"9144" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9144.jpg" +"9145" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9145.jpg" +"9146" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9146.jpg" +"9147" "Is there a microphone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9147.jpg" +"9148" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9148.jpg" +"9149" "Is there a support in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9149.jpg" +"9150" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9150.jpg" +"9151" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9151.jpg" +"9152" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9152.jpg" +"9153" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9153.jpg" +"9154" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9154.jpg" +"9155" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9155.jpg" +"9156" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9156.jpg" +"9157" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9157.jpg" +"9158" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9158.jpg" +"9159" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9159.jpg" +"9160" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9160.jpg" +"9161" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9161.jpg" +"9162" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9162.jpg" +"9163" "Is there a duck in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9163.jpg" +"9164" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9164.jpg" +"9165" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9165.jpg" +"9166" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9166.jpg" +"9167" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9167.jpg" +"9168" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9168.jpg" +"9169" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9169.jpg" +"9170" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9170.jpg" +"9171" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9171.jpg" +"9172" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9172.jpg" +"9173" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9173.jpg" +"9174" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9174.jpg" +"9175" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9175.jpg" +"9176" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9176.jpg" +"9177" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9177.jpg" +"9178" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9178.jpg" +"9179" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9179.jpg" +"9180" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9180.jpg" +"9181" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9181.jpg" +"9182" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9182.jpg" +"9183" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9183.jpg" +"9184" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9184.jpg" +"9185" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9185.jpg" +"9186" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9186.jpg" +"9187" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9187.jpg" +"9188" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9188.jpg" +"9189" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9189.jpg" +"9190" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9190.jpg" +"9191" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9191.jpg" +"9192" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9192.jpg" +"9193" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9193.jpg" +"9194" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9194.jpg" +"9195" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9195.jpg" +"9196" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9196.jpg" +"9197" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9197.jpg" +"9198" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9198.jpg" +"9199" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9199.jpg" +"9200" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9200.jpg" +"9201" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9201.jpg" +"9202" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9202.jpg" +"9203" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9203.jpg" +"9204" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9204.jpg" +"9205" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9205.jpg" +"9206" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9206.jpg" +"9207" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9207.jpg" +"9208" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9208.jpg" +"9209" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9209.jpg" +"9210" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9210.jpg" +"9211" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9211.jpg" +"9212" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9212.jpg" +"9213" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9213.jpg" +"9214" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9214.jpg" +"9215" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9215.jpg" +"9216" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9216.jpg" +"9217" "Is there a piano in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9217.jpg" +"9218" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9218.jpg" +"9219" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9219.jpg" +"9220" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9220.jpg" +"9221" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9221.jpg" +"9222" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9222.jpg" +"9223" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9223.jpg" +"9224" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9224.jpg" +"9225" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9225.jpg" +"9226" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9226.jpg" +"9227" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9227.jpg" +"9228" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9228.jpg" +"9229" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9229.jpg" +"9230" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9230.jpg" +"9231" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9231.jpg" +"9232" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9232.jpg" +"9233" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9233.jpg" +"9234" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9234.jpg" +"9235" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9235.jpg" +"9236" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9236.jpg" +"9237" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9237.jpg" +"9238" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9238.jpg" +"9239" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9239.jpg" +"9240" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9240.jpg" +"9241" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9241.jpg" +"9242" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9242.jpg" +"9243" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9243.jpg" +"9244" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9244.jpg" +"9245" "Is there a horse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9245.jpg" +"9246" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9246.jpg" +"9247" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9247.jpg" +"9248" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9248.jpg" +"9249" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9249.jpg" +"9250" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9250.jpg" +"9251" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9251.jpg" +"9252" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9252.jpg" +"9253" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9253.jpg" +"9254" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9254.jpg" +"9255" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9255.jpg" +"9256" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9256.jpg" +"9257" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9257.jpg" +"9258" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9258.jpg" +"9259" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9259.jpg" +"9260" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9260.jpg" +"9261" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9261.jpg" +"9262" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9262.jpg" +"9263" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9263.jpg" +"9264" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9264.jpg" +"9265" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9265.jpg" +"9266" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9266.jpg" +"9267" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9267.jpg" +"9268" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9268.jpg" +"9269" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9269.jpg" +"9270" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9270.jpg" +"9271" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9271.jpg" +"9272" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9272.jpg" +"9273" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9273.jpg" +"9274" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9274.jpg" +"9275" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9275.jpg" +"9276" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9276.jpg" +"9277" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9277.jpg" +"9278" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9278.jpg" +"9279" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9279.jpg" +"9280" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9280.jpg" +"9281" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9281.jpg" +"9282" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9282.jpg" +"9283" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9283.jpg" +"9284" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9284.jpg" +"9285" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9285.jpg" +"9286" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9286.jpg" +"9287" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9287.jpg" +"9288" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9288.jpg" +"9289" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9289.jpg" +"9290" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9290.jpg" +"9291" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9291.jpg" +"9292" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9292.jpg" +"9293" "Is there a camel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9293.jpg" +"9294" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9294.jpg" +"9295" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9295.jpg" +"9296" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9296.jpg" +"9297" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9297.jpg" +"9298" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9298.jpg" +"9299" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9299.jpg" +"9300" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9300.jpg" +"9301" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9301.jpg" +"9302" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9302.jpg" +"9303" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9303.jpg" +"9304" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9304.jpg" +"9305" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9305.jpg" +"9306" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9306.jpg" +"9307" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9307.jpg" +"9308" "Is there a camera in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9308.jpg" +"9309" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9309.jpg" +"9310" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9310.jpg" +"9311" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9311.jpg" +"9312" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9312.jpg" +"9313" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9313.jpg" +"9314" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9314.jpg" +"9315" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9315.jpg" +"9316" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9316.jpg" +"9317" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9317.jpg" +"9318" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9318.jpg" +"9319" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9319.jpg" +"9320" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9320.jpg" +"9321" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9321.jpg" +"9322" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9322.jpg" +"9323" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9323.jpg" +"9324" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9324.jpg" +"9325" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9325.jpg" +"9326" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9326.jpg" +"9327" "Is there a bread in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9327.jpg" +"9328" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9328.jpg" +"9329" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9329.jpg" +"9330" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9330.jpg" +"9331" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9331.jpg" +"9332" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9332.jpg" +"9333" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9333.jpg" +"9334" "Is there a snowman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9334.jpg" +"9335" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9335.jpg" +"9336" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9336.jpg" +"9337" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9337.jpg" +"9338" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9338.jpg" +"9339" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9339.jpg" +"9340" "Is there a camel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9340.jpg" +"9341" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9341.jpg" +"9342" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9342.jpg" +"9343" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9343.jpg" +"9344" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9344.jpg" +"9345" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9345.jpg" +"9346" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9346.jpg" +"9347" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9347.jpg" +"9348" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9348.jpg" +"9349" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9349.jpg" +"9350" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9350.jpg" +"9351" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9351.jpg" +"9352" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9352.jpg" +"9353" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9353.jpg" +"9354" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9354.jpg" +"9355" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9355.jpg" +"9356" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9356.jpg" +"9357" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9357.jpg" +"9358" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9358.jpg" +"9359" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9359.jpg" +"9360" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9360.jpg" +"9361" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9361.jpg" +"9362" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9362.jpg" +"9363" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9363.jpg" +"9364" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9364.jpg" +"9365" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9365.jpg" +"9366" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9366.jpg" +"9367" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9367.jpg" +"9368" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9368.jpg" +"9369" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9369.jpg" +"9370" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9370.jpg" +"9371" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9371.jpg" +"9372" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9372.jpg" +"9373" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9373.jpg" +"9374" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9374.jpg" +"9375" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9375.jpg" +"9376" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9376.jpg" +"9377" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9377.jpg" +"9378" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9378.jpg" +"9379" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9379.jpg" +"9380" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9380.jpg" +"9381" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9381.jpg" +"9382" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9382.jpg" +"9383" "Is there a court in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9383.jpg" +"9384" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9384.jpg" +"9385" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9385.jpg" +"9386" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9386.jpg" +"9387" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9387.jpg" +"9388" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9388.jpg" +"9389" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9389.jpg" +"9390" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9390.jpg" +"9391" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9391.jpg" +"9392" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9392.jpg" +"9393" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9393.jpg" +"9394" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9394.jpg" +"9395" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9395.jpg" +"9396" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9396.jpg" +"9397" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9397.jpg" +"9398" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9398.jpg" +"9399" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9399.jpg" +"9400" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9400.jpg" +"9401" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9401.jpg" +"9402" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9402.jpg" +"9403" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9403.jpg" +"9404" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9404.jpg" +"9405" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9405.jpg" +"9406" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9406.jpg" +"9407" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9407.jpg" +"9408" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9408.jpg" +"9409" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9409.jpg" +"9410" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9410.jpg" +"9411" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9411.jpg" +"9412" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9412.jpg" +"9413" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9413.jpg" +"9414" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9414.jpg" +"9415" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9415.jpg" +"9416" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9416.jpg" +"9417" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9417.jpg" +"9418" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9418.jpg" +"9419" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9419.jpg" +"9420" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9420.jpg" +"9421" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9421.jpg" +"9422" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9422.jpg" +"9423" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9423.jpg" +"9424" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9424.jpg" +"9425" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9425.jpg" +"9426" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9426.jpg" +"9427" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9427.jpg" +"9428" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9428.jpg" +"9429" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9429.jpg" +"9430" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9430.jpg" +"9431" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9431.jpg" +"9432" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9432.jpg" +"9433" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9433.jpg" +"9434" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9434.jpg" +"9435" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9435.jpg" +"9436" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9436.jpg" +"9437" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9437.jpg" +"9438" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9438.jpg" +"9439" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9439.jpg" +"9440" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9440.jpg" +"9441" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9441.jpg" +"9442" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9442.jpg" +"9443" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9443.jpg" +"9444" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9444.jpg" +"9445" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9445.jpg" +"9446" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9446.jpg" +"9447" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9447.jpg" +"9448" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9448.jpg" +"9449" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9449.jpg" +"9450" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9450.jpg" +"9451" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9451.jpg" +"9452" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9452.jpg" +"9453" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9453.jpg" +"9454" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9454.jpg" +"9455" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9455.jpg" +"9456" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9456.jpg" +"9457" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9457.jpg" +"9458" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9458.jpg" +"9459" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9459.jpg" +"9460" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9460.jpg" +"9461" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9461.jpg" +"9462" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9462.jpg" +"9463" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9463.jpg" +"9464" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9464.jpg" +"9465" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9465.jpg" +"9466" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9466.jpg" +"9467" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9467.jpg" +"9468" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9468.jpg" +"9469" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9469.jpg" +"9470" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9470.jpg" +"9471" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9471.jpg" +"9472" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9472.jpg" +"9473" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9473.jpg" +"9474" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9474.jpg" +"9475" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9475.jpg" +"9476" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9476.jpg" +"9477" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9477.jpg" +"9478" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9478.jpg" +"9479" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9479.jpg" +"9480" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9480.jpg" +"9481" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9481.jpg" +"9482" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9482.jpg" +"9483" "Is there a scoon in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9483.jpg" +"9484" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9484.jpg" +"9485" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9485.jpg" +"9486" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9486.jpg" +"9487" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9487.jpg" +"9488" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9488.jpg" +"9489" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9489.jpg" +"9490" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9490.jpg" +"9491" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9491.jpg" +"9492" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9492.jpg" +"9493" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9493.jpg" +"9494" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9494.jpg" +"9495" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9495.jpg" +"9496" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9496.jpg" +"9497" "Is there a toilet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9497.jpg" +"9498" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9498.jpg" +"9499" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9499.jpg" +"9500" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9500.jpg" +"9501" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9501.jpg" +"9502" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9502.jpg" +"9503" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9503.jpg" +"9504" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9504.jpg" +"9505" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9505.jpg" +"9506" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9506.jpg" +"9507" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9507.jpg" +"9508" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9508.jpg" +"9509" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9509.jpg" +"9510" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9510.jpg" +"9511" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9511.jpg" +"9512" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9512.jpg" +"9513" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9513.jpg" +"9514" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9514.jpg" +"9515" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9515.jpg" +"9516" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9516.jpg" +"9517" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9517.jpg" +"9518" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9518.jpg" +"9519" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9519.jpg" +"9520" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9520.jpg" +"9521" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9521.jpg" +"9522" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9522.jpg" +"9523" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9523.jpg" +"9524" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9524.jpg" +"9525" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9525.jpg" +"9526" "Is there a candle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9526.jpg" +"9527" "Is there a steak in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9527.jpg" +"9528" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9528.jpg" +"9529" "Is there a wine in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9529.jpg" +"9530" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9530.jpg" +"9531" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9531.jpg" +"9532" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9532.jpg" +"9533" "Is there a glass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9533.jpg" +"9534" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9534.jpg" +"9535" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9535.jpg" +"9536" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9536.jpg" +"9537" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9537.jpg" +"9538" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9538.jpg" +"9539" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9539.jpg" +"9540" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9540.jpg" +"9541" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9541.jpg" +"9542" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9542.jpg" +"9543" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9543.jpg" +"9544" "Is there a bookshelf in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9544.jpg" +"9545" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9545.jpg" +"9546" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9546.jpg" +"9547" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9547.jpg" +"9548" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9548.jpg" +"9549" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9549.jpg" +"9550" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9550.jpg" +"9551" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9551.jpg" +"9552" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9552.jpg" +"9553" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9553.jpg" +"9554" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9554.jpg" +"9555" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9555.jpg" +"9556" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9556.jpg" +"9557" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9557.jpg" +"9558" "Is there a monkey in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9558.jpg" +"9559" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9559.jpg" +"9560" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9560.jpg" +"9561" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9561.jpg" +"9562" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9562.jpg" +"9563" "Is there a cushion in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9563.jpg" +"9564" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9564.jpg" +"9565" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9565.jpg" +"9566" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9566.jpg" +"9567" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9567.jpg" +"9568" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9568.jpg" +"9569" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9569.jpg" +"9570" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9570.jpg" +"9571" "Is there a rainbow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9571.jpg" +"9572" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9572.jpg" +"9573" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9573.jpg" +"9574" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9574.jpg" +"9575" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9575.jpg" +"9576" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9576.jpg" +"9577" "Is there a cushion in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9577.jpg" +"9578" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9578.jpg" +"9579" "Is there a cage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9579.jpg" +"9580" "Is there a basin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9580.jpg" +"9581" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9581.jpg" +"9582" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9582.jpg" +"9583" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9583.jpg" +"9584" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9584.jpg" +"9585" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9585.jpg" +"9586" "Is there a stair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9586.jpg" +"9587" "Is there a railing in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9587.jpg" +"9588" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9588.jpg" +"9589" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9589.jpg" +"9590" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9590.jpg" +"9591" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9591.jpg" +"9592" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9592.jpg" +"9593" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9593.jpg" +"9594" "Is there a cushion in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9594.jpg" +"9595" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9595.jpg" +"9596" "Is there a kettle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9596.jpg" +"9597" "Is there a trough in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9597.jpg" +"9598" "Is there a cooker in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9598.jpg" +"9599" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9599.jpg" +"9600" "Is there a refrigerator in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9600.jpg" +"9601" "Is there a lion in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9601.jpg" +"9602" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9602.jpg" +"9603" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9603.jpg" +"9604" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9604.jpg" +"9605" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9605.jpg" +"9606" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9606.jpg" +"9607" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9607.jpg" +"9608" "Is there a fishnet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9608.jpg" +"9609" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9609.jpg" +"9610" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9610.jpg" +"9611" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9611.jpg" +"9612" "Is there a pen in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9612.jpg" +"9613" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9613.jpg" +"9614" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9614.jpg" +"9615" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9615.jpg" +"9616" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9616.jpg" +"9617" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9617.jpg" +"9618" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9618.jpg" +"9619" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9619.jpg" +"9620" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9620.jpg" +"9621" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9621.jpg" +"9622" "Is there a dresser in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9622.jpg" +"9623" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9623.jpg" +"9624" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9624.jpg" +"9625" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9625.jpg" +"9626" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9626.jpg" +"9627" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9627.jpg" +"9628" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9628.jpg" +"9629" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9629.jpg" +"9630" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9630.jpg" +"9631" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9631.jpg" +"9632" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9632.jpg" +"9633" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9633.jpg" +"9634" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9634.jpg" +"9635" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9635.jpg" +"9636" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9636.jpg" +"9637" "Is there a guardrail in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9637.jpg" +"9638" "Is there a signal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9638.jpg" +"9639" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9639.jpg" +"9640" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9640.jpg" +"9641" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9641.jpg" +"9642" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9642.jpg" +"9643" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9643.jpg" +"9644" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9644.jpg" +"9645" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9645.jpg" +"9646" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9646.jpg" +"9647" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9647.jpg" +"9648" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9648.jpg" +"9649" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9649.jpg" +"9650" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9650.jpg" +"9651" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9651.jpg" +"9652" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9652.jpg" +"9653" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9653.jpg" +"9654" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9654.jpg" +"9655" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9655.jpg" +"9656" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9656.jpg" +"9657" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9657.jpg" +"9658" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9658.jpg" +"9659" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9659.jpg" +"9660" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9660.jpg" +"9661" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9661.jpg" +"9662" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9662.jpg" +"9663" "Is there a rail in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9663.jpg" +"9664" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9664.jpg" +"9665" "Is there a luggage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9665.jpg" +"9666" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9666.jpg" +"9667" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9667.jpg" +"9668" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9668.jpg" +"9669" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9669.jpg" +"9670" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9670.jpg" +"9671" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9671.jpg" +"9672" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9672.jpg" +"9673" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9673.jpg" +"9674" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9674.jpg" +"9675" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9675.jpg" +"9676" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9676.jpg" +"9677" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9677.jpg" +"9678" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9678.jpg" +"9679" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9679.jpg" +"9680" "Is there a pot in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9680.jpg" +"9681" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9681.jpg" +"9682" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9682.jpg" +"9683" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9683.jpg" +"9684" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9684.jpg" +"9685" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9685.jpg" +"9686" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9686.jpg" +"9687" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9687.jpg" +"9688" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9688.jpg" +"9689" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9689.jpg" +"9690" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9690.jpg" +"9691" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9691.jpg" +"9692" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9692.jpg" +"9693" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9693.jpg" +"9694" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9694.jpg" +"9695" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9695.jpg" +"9696" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9696.jpg" +"9697" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9697.jpg" +"9698" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9698.jpg" +"9699" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9699.jpg" +"9700" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9700.jpg" +"9701" "Is there a zebra in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9701.jpg" +"9702" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9702.jpg" +"9703" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9703.jpg" +"9704" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9704.jpg" +"9705" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9705.jpg" +"9706" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9706.jpg" +"9707" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9707.jpg" +"9708" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9708.jpg" +"9709" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9709.jpg" +"9710" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9710.jpg" +"9711" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9711.jpg" +"9712" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9712.jpg" +"9713" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9713.jpg" +"9714" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9714.jpg" +"9715" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9715.jpg" +"9716" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9716.jpg" +"9717" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9717.jpg" +"9718" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9718.jpg" +"9719" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9719.jpg" +"9720" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9720.jpg" +"9721" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9721.jpg" +"9722" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9722.jpg" +"9723" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9723.jpg" +"9724" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9724.jpg" +"9725" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9725.jpg" +"9726" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9726.jpg" +"9727" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9727.jpg" +"9728" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9728.jpg" +"9729" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9729.jpg" +"9730" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9730.jpg" +"9731" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9731.jpg" +"9732" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9732.jpg" +"9733" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9733.jpg" +"9734" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9734.jpg" +"9735" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9735.jpg" +"9736" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9736.jpg" +"9737" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9737.jpg" +"9738" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9738.jpg" +"9739" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9739.jpg" +"9740" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9740.jpg" +"9741" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9741.jpg" +"9742" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9742.jpg" +"9743" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9743.jpg" +"9744" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9744.jpg" +"9745" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9745.jpg" +"9746" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9746.jpg" +"9747" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9747.jpg" +"9748" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9748.jpg" +"9749" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9749.jpg" +"9750" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9750.jpg" +"9751" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9751.jpg" +"9752" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9752.jpg" +"9753" "Is there a rope in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9753.jpg" +"9754" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9754.jpg" +"9755" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9755.jpg" +"9756" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9756.jpg" +"9757" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9757.jpg" +"9758" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9758.jpg" +"9759" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9759.jpg" +"9760" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9760.jpg" +"9761" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9761.jpg" +"9762" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9762.jpg" +"9763" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9763.jpg" +"9764" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9764.jpg" +"9765" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9765.jpg" +"9766" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9766.jpg" +"9767" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9767.jpg" +"9768" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9768.jpg" +"9769" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9769.jpg" +"9770" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9770.jpg" +"9771" "Is there a elephant in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9771.jpg" +"9772" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9772.jpg" +"9773" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9773.jpg" +"9774" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9774.jpg" +"9775" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9775.jpg" +"9776" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9776.jpg" +"9777" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9777.jpg" +"9778" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9778.jpg" +"9779" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9779.jpg" +"9780" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9780.jpg" +"9781" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9781.jpg" +"9782" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9782.jpg" +"9783" "Is there a shampoo in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9783.jpg" +"9784" "Is there a shampoo in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9784.jpg" +"9785" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9785.jpg" +"9786" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9786.jpg" +"9787" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9787.jpg" +"9788" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9788.jpg" +"9789" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9789.jpg" +"9790" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9790.jpg" +"9791" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9791.jpg" +"9792" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9792.jpg" +"9793" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9793.jpg" +"9794" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9794.jpg" +"9795" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9795.jpg" +"9796" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9796.jpg" +"9797" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9797.jpg" +"9798" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9798.jpg" +"9799" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9799.jpg" +"9800" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9800.jpg" +"9801" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9801.jpg" +"9802" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9802.jpg" +"9803" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9803.jpg" +"9804" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9804.jpg" +"9805" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9805.jpg" +"9806" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9806.jpg" +"9807" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9807.jpg" +"9808" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9808.jpg" +"9809" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9809.jpg" +"9810" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9810.jpg" +"9811" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9811.jpg" +"9812" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9812.jpg" +"9813" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9813.jpg" +"9814" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9814.jpg" +"9815" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9815.jpg" +"9816" "Is there a zebra in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9816.jpg" +"9817" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9817.jpg" +"9818" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9818.jpg" +"9819" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9819.jpg" +"9820" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9820.jpg" +"9821" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9821.jpg" +"9822" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9822.jpg" +"9823" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9823.jpg" +"9824" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9824.jpg" +"9825" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9825.jpg" +"9826" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9826.jpg" +"9827" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9827.jpg" +"9828" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9828.jpg" +"9829" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9829.jpg" +"9830" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9830.jpg" +"9831" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9831.jpg" +"9832" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9832.jpg" +"9833" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9833.jpg" +"9834" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9834.jpg" +"9835" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9835.jpg" +"9836" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9836.jpg" +"9837" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9837.jpg" +"9838" "Is there a duck in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9838.jpg" +"9839" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9839.jpg" +"9840" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9840.jpg" +"9841" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9841.jpg" +"9842" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9842.jpg" +"9843" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9843.jpg" +"9844" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9844.jpg" +"9845" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9845.jpg" +"9846" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9846.jpg" +"9847" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9847.jpg" +"9848" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9848.jpg" +"9849" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9849.jpg" +"9850" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9850.jpg" +"9851" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9851.jpg" +"9852" "Is there a pole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9852.jpg" +"9853" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9853.jpg" +"9854" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9854.jpg" +"9855" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9855.jpg" +"9856" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9856.jpg" +"9857" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9857.jpg" +"9858" "Is there a drink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9858.jpg" +"9859" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9859.jpg" +"9860" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9860.jpg" +"9861" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9861.jpg" +"9862" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9862.jpg" +"9863" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9863.jpg" +"9864" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9864.jpg" +"9865" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9865.jpg" +"9866" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9866.jpg" +"9867" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9867.jpg" +"9868" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9868.jpg" +"9869" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9869.jpg" +"9870" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9870.jpg" +"9871" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9871.jpg" +"9872" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9872.jpg" +"9873" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9873.jpg" +"9874" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9874.jpg" +"9875" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9875.jpg" +"9876" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9876.jpg" +"9877" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9877.jpg" +"9878" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9878.jpg" +"9879" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9879.jpg" +"9880" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9880.jpg" +"9881" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9881.jpg" +"9882" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9882.jpg" +"9883" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9883.jpg" +"9884" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9884.jpg" +"9885" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9885.jpg" +"9886" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9886.jpg" +"9887" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9887.jpg" +"9888" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9888.jpg" +"9889" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9889.jpg" +"9890" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9890.jpg" +"9891" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9891.jpg" +"9892" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9892.jpg" +"9893" "Is there a eagle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9893.jpg" +"9894" "Is there a plane in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9894.jpg" +"9895" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9895.jpg" +"9896" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9896.jpg" +"9897" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9897.jpg" +"9898" "Is there a air-conditioning in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9898.jpg" +"9899" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9899.jpg" +"9900" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9900.jpg" +"9901" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9901.jpg" +"9902" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9902.jpg" +"9903" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9903.jpg" +"9904" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9904.jpg" +"9905" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9905.jpg" +"9906" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9906.jpg" +"9907" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9907.jpg" +"9908" "Is there a earphone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9908.jpg" +"9909" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9909.jpg" +"9910" "Is there a shell in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9910.jpg" +"9911" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9911.jpg" +"9912" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9912.jpg" +"9913" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9913.jpg" +"9914" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9914.jpg" +"9915" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9915.jpg" +"9916" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9916.jpg" +"9917" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9917.jpg" +"9918" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9918.jpg" +"9919" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9919.jpg" +"9920" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9920.jpg" +"9921" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9921.jpg" +"9922" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9922.jpg" +"9923" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9923.jpg" +"9924" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9924.jpg" +"9925" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9925.jpg" +"9926" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9926.jpg" +"9927" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9927.jpg" +"9928" "Is there a leopard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9928.jpg" +"9929" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9929.jpg" +"9930" "Is there a crocodile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9930.jpg" +"9931" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9931.jpg" +"9932" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9932.jpg" +"9933" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9933.jpg" +"9934" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9934.jpg" +"9935" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9935.jpg" +"9936" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9936.jpg" +"9937" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9937.jpg" +"9938" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9938.jpg" +"9939" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9939.jpg" +"9940" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9940.jpg" +"9941" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9941.jpg" +"9942" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9942.jpg" +"9943" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9943.jpg" +"9944" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9944.jpg" +"9945" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9945.jpg" +"9946" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9946.jpg" +"9947" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9947.jpg" +"9948" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9948.jpg" +"9949" "Is there a bed in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9949.jpg" +"9950" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9950.jpg" +"9951" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9951.jpg" +"9952" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9952.jpg" +"9953" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9953.jpg" +"9954" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9954.jpg" +"9955" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9955.jpg" +"9956" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9956.jpg" +"9957" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9957.jpg" +"9958" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9958.jpg" +"9959" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9959.jpg" +"9960" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9960.jpg" +"9961" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9961.jpg" +"9962" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9962.jpg" +"9963" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9963.jpg" +"9964" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9964.jpg" +"9965" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9965.jpg" +"9966" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9966.jpg" +"9967" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9967.jpg" +"9968" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9968.jpg" +"9969" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9969.jpg" +"9970" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9970.jpg" +"9971" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9971.jpg" +"9972" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9972.jpg" +"9973" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9973.jpg" +"9974" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9974.jpg" +"9975" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9975.jpg" +"9976" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9976.jpg" +"9977" "Is there a glacier in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9977.jpg" +"9978" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9978.jpg" +"9979" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9979.jpg" +"9980" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9980.jpg" +"9981" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9981.jpg" +"9982" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9982.jpg" +"9983" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9983.jpg" +"9984" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9984.jpg" +"9985" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9985.jpg" +"9986" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9986.jpg" +"9987" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9987.jpg" +"9988" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9988.jpg" +"9989" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9989.jpg" +"9990" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9990.jpg" +"9991" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9991.jpg" +"9992" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9992.jpg" +"9993" "Is there a pad in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9993.jpg" +"9994" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9994.jpg" +"9995" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9995.jpg" +"9996" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9996.jpg" +"9997" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9997.jpg" +"9998" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9998.jpg" +"9999" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/9999.jpg" +"10000" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10000.jpg" +"10001" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10001.jpg" +"10002" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10002.jpg" +"10003" "Is there a elephant in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10003.jpg" +"10004" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10004.jpg" +"10005" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10005.jpg" +"10006" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10006.jpg" +"10007" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10007.jpg" +"10008" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10008.jpg" +"10009" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10009.jpg" +"10010" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10010.jpg" +"10011" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10011.jpg" +"10012" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10012.jpg" +"10013" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10013.jpg" +"10014" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10014.jpg" +"10015" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10015.jpg" +"10016" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10016.jpg" +"10017" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10017.jpg" +"10018" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10018.jpg" +"10019" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10019.jpg" +"10020" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10020.jpg" +"10021" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10021.jpg" +"10022" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10022.jpg" +"10023" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10023.jpg" +"10024" "Is there a bus in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10024.jpg" +"10025" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10025.jpg" +"10026" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10026.jpg" +"10027" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10027.jpg" +"10028" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10028.jpg" +"10029" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10029.jpg" +"10030" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10030.jpg" +"10031" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10031.jpg" +"10032" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10032.jpg" +"10033" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10033.jpg" +"10034" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10034.jpg" +"10035" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10035.jpg" +"10036" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10036.jpg" +"10037" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10037.jpg" +"10038" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10038.jpg" +"10039" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10039.jpg" +"10040" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10040.jpg" +"10041" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10041.jpg" +"10042" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10042.jpg" +"10043" "Is there a sailing in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10043.jpg" +"10044" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10044.jpg" +"10045" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10045.jpg" +"10046" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10046.jpg" +"10047" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10047.jpg" +"10048" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10048.jpg" +"10049" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10049.jpg" +"10050" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10050.jpg" +"10051" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10051.jpg" +"10052" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10052.jpg" +"10053" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10053.jpg" +"10054" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10054.jpg" +"10055" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10055.jpg" +"10056" "Is there a cake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10056.jpg" +"10057" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10057.jpg" +"10058" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10058.jpg" +"10059" "Is there a newspaper in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10059.jpg" +"10060" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10060.jpg" +"10061" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10061.jpg" +"10062" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10062.jpg" +"10063" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10063.jpg" +"10064" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10064.jpg" +"10065" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10065.jpg" +"10066" "Is there a bus in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10066.jpg" +"10067" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10067.jpg" +"10068" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10068.jpg" +"10069" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10069.jpg" +"10070" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10070.jpg" +"10071" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10071.jpg" +"10072" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10072.jpg" +"10073" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10073.jpg" +"10074" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10074.jpg" +"10075" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10075.jpg" +"10076" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10076.jpg" +"10077" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10077.jpg" +"10078" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10078.jpg" +"10079" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10079.jpg" +"10080" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10080.jpg" +"10081" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10081.jpg" +"10082" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10082.jpg" +"10083" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10083.jpg" +"10084" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10084.jpg" +"10085" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10085.jpg" +"10086" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10086.jpg" +"10087" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10087.jpg" +"10088" "Is there a pole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10088.jpg" +"10089" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10089.jpg" +"10090" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10090.jpg" +"10091" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10091.jpg" +"10092" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10092.jpg" +"10093" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10093.jpg" +"10094" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10094.jpg" +"10095" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10095.jpg" +"10096" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10096.jpg" +"10097" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10097.jpg" +"10098" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10098.jpg" +"10099" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10099.jpg" +"10100" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10100.jpg" +"10101" "Is there a bus in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10101.jpg" +"10102" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10102.jpg" +"10103" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10103.jpg" +"10104" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10104.jpg" +"10105" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10105.jpg" +"10106" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10106.jpg" +"10107" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10107.jpg" +"10108" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10108.jpg" +"10109" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10109.jpg" +"10110" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10110.jpg" +"10111" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10111.jpg" +"10112" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10112.jpg" +"10113" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10113.jpg" +"10114" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10114.jpg" +"10115" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10115.jpg" +"10116" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10116.jpg" +"10117" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10117.jpg" +"10118" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10118.jpg" +"10119" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10119.jpg" +"10120" "Is there a elephant in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10120.jpg" +"10121" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10121.jpg" +"10122" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10122.jpg" +"10123" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10123.jpg" +"10124" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10124.jpg" +"10125" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10125.jpg" +"10126" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10126.jpg" +"10127" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10127.jpg" +"10128" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10128.jpg" +"10129" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10129.jpg" +"10130" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10130.jpg" +"10131" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10131.jpg" +"10132" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10132.jpg" +"10133" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10133.jpg" +"10134" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10134.jpg" +"10135" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10135.jpg" +"10136" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10136.jpg" +"10137" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10137.jpg" +"10138" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10138.jpg" +"10139" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10139.jpg" +"10140" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10140.jpg" +"10141" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10141.jpg" +"10142" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10142.jpg" +"10143" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10143.jpg" +"10144" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10144.jpg" +"10145" "Is there a elephant in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10145.jpg" +"10146" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10146.jpg" +"10147" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10147.jpg" +"10148" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10148.jpg" +"10149" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10149.jpg" +"10150" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10150.jpg" +"10151" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10151.jpg" +"10152" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10152.jpg" +"10153" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10153.jpg" +"10154" "Is there a sailing in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10154.jpg" +"10155" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10155.jpg" +"10156" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10156.jpg" +"10157" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10157.jpg" +"10158" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10158.jpg" +"10159" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10159.jpg" +"10160" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10160.jpg" +"10161" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10161.jpg" +"10162" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10162.jpg" +"10163" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10163.jpg" +"10164" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10164.jpg" +"10165" "Is there a luggage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10165.jpg" +"10166" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10166.jpg" +"10167" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10167.jpg" +"10168" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10168.jpg" +"10169" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10169.jpg" +"10170" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10170.jpg" +"10171" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10171.jpg" +"10172" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10172.jpg" +"10173" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10173.jpg" +"10174" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10174.jpg" +"10175" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10175.jpg" +"10176" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10176.jpg" +"10177" "Is there a luggage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10177.jpg" +"10178" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10178.jpg" +"10179" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10179.jpg" +"10180" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10180.jpg" +"10181" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10181.jpg" +"10182" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10182.jpg" +"10183" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10183.jpg" +"10184" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10184.jpg" +"10185" "Is there a butterfly in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10185.jpg" +"10186" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10186.jpg" +"10187" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10187.jpg" +"10188" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10188.jpg" +"10189" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10189.jpg" +"10190" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10190.jpg" +"10191" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10191.jpg" +"10192" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10192.jpg" +"10193" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10193.jpg" +"10194" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10194.jpg" +"10195" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10195.jpg" +"10196" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10196.jpg" +"10197" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10197.jpg" +"10198" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10198.jpg" +"10199" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10199.jpg" +"10200" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10200.jpg" +"10201" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10201.jpg" +"10202" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10202.jpg" +"10203" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10203.jpg" +"10204" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10204.jpg" +"10205" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10205.jpg" +"10206" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10206.jpg" +"10207" "Is there a butterfly in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10207.jpg" +"10208" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10208.jpg" +"10209" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10209.jpg" +"10210" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10210.jpg" +"10211" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10211.jpg" +"10212" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10212.jpg" +"10213" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10213.jpg" +"10214" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10214.jpg" +"10215" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10215.jpg" +"10216" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10216.jpg" +"10217" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10217.jpg" +"10218" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10218.jpg" +"10219" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10219.jpg" +"10220" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10220.jpg" +"10221" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10221.jpg" +"10222" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10222.jpg" +"10223" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10223.jpg" +"10224" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10224.jpg" +"10225" "Is there a basin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10225.jpg" +"10226" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10226.jpg" +"10227" "Is there a cushion in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10227.jpg" +"10228" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10228.jpg" +"10229" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10229.jpg" +"10230" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10230.jpg" +"10231" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10231.jpg" +"10232" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10232.jpg" +"10233" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10233.jpg" +"10234" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10234.jpg" +"10235" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10235.jpg" +"10236" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10236.jpg" +"10237" "Is there a earphone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10237.jpg" +"10238" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10238.jpg" +"10239" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10239.jpg" +"10240" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10240.jpg" +"10241" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10241.jpg" +"10242" "Is there a fishnet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10242.jpg" +"10243" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10243.jpg" +"10244" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10244.jpg" +"10245" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10245.jpg" +"10246" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10246.jpg" +"10247" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10247.jpg" +"10248" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10248.jpg" +"10249" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10249.jpg" +"10250" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10250.jpg" +"10251" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10251.jpg" +"10252" "Is there a rabbit in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10252.jpg" +"10253" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10253.jpg" +"10254" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10254.jpg" +"10255" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10255.jpg" +"10256" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10256.jpg" +"10257" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10257.jpg" +"10258" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10258.jpg" +"10259" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10259.jpg" +"10260" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10260.jpg" +"10261" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10261.jpg" +"10262" "Is there a bridge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10262.jpg" +"10263" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10263.jpg" +"10264" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10264.jpg" +"10265" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10265.jpg" +"10266" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10266.jpg" +"10267" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10267.jpg" +"10268" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10268.jpg" +"10269" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10269.jpg" +"10270" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10270.jpg" +"10271" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10271.jpg" +"10272" "Is there a brush in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10272.jpg" +"10273" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10273.jpg" +"10274" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10274.jpg" +"10275" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10275.jpg" +"10276" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10276.jpg" +"10277" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10277.jpg" +"10278" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10278.jpg" +"10279" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10279.jpg" +"10280" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10280.jpg" +"10281" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10281.jpg" +"10282" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10282.jpg" +"10283" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10283.jpg" +"10284" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10284.jpg" +"10285" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10285.jpg" +"10286" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10286.jpg" +"10287" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10287.jpg" +"10288" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10288.jpg" +"10289" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10289.jpg" +"10290" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10290.jpg" +"10291" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10291.jpg" +"10292" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10292.jpg" +"10293" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10293.jpg" +"10294" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10294.jpg" +"10295" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10295.jpg" +"10296" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10296.jpg" +"10297" "Is there a paper in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10297.jpg" +"10298" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10298.jpg" +"10299" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10299.jpg" +"10300" "Is there a support in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10300.jpg" +"10301" "Is there a toilet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10301.jpg" +"10302" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10302.jpg" +"10303" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10303.jpg" +"10304" "Is there a yacht in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10304.jpg" +"10305" "Is there a buoy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10305.jpg" +"10306" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10306.jpg" +"10307" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10307.jpg" +"10308" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10308.jpg" +"10309" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10309.jpg" +"10310" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10310.jpg" +"10311" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10311.jpg" +"10312" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10312.jpg" +"10313" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10313.jpg" +"10314" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10314.jpg" +"10315" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10315.jpg" +"10316" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10316.jpg" +"10317" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10317.jpg" +"10318" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10318.jpg" +"10319" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10319.jpg" +"10320" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10320.jpg" +"10321" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10321.jpg" +"10322" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10322.jpg" +"10323" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10323.jpg" +"10324" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10324.jpg" +"10325" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10325.jpg" +"10326" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10326.jpg" +"10327" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10327.jpg" +"10328" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10328.jpg" +"10329" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10329.jpg" +"10330" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10330.jpg" +"10331" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10331.jpg" +"10332" "Is there a paper in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10332.jpg" +"10333" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10333.jpg" +"10334" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10334.jpg" +"10335" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10335.jpg" +"10336" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10336.jpg" +"10337" "Is there a dustbin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10337.jpg" +"10338" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10338.jpg" +"10339" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10339.jpg" +"10340" "Is there a socket in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10340.jpg" +"10341" "Is there a charger in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10341.jpg" +"10342" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10342.jpg" +"10343" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10343.jpg" +"10344" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10344.jpg" +"10345" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10345.jpg" +"10346" "Is there a toothbrush in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10346.jpg" +"10347" "Is there a dryer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10347.jpg" +"10348" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10348.jpg" +"10349" "Is there a hanger in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10349.jpg" +"10350" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10350.jpg" +"10351" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10351.jpg" +"10352" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10352.jpg" +"10353" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10353.jpg" +"10354" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10354.jpg" +"10355" "Is there a cable in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10355.jpg" +"10356" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10356.jpg" +"10357" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10357.jpg" +"10358" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10358.jpg" +"10359" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10359.jpg" +"10360" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10360.jpg" +"10361" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10361.jpg" +"10362" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10362.jpg" +"10363" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10363.jpg" +"10364" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10364.jpg" +"10365" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10365.jpg" +"10366" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10366.jpg" +"10367" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10367.jpg" +"10368" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10368.jpg" +"10369" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10369.jpg" +"10370" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10370.jpg" +"10371" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10371.jpg" +"10372" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10372.jpg" +"10373" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10373.jpg" +"10374" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10374.jpg" +"10375" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10375.jpg" +"10376" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10376.jpg" +"10377" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10377.jpg" +"10378" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10378.jpg" +"10379" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10379.jpg" +"10380" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10380.jpg" +"10381" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10381.jpg" +"10382" "Is there a paper in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10382.jpg" +"10383" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10383.jpg" +"10384" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10384.jpg" +"10385" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10385.jpg" +"10386" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10386.jpg" +"10387" "Is there a dustbin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10387.jpg" +"10388" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10388.jpg" +"10389" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10389.jpg" +"10390" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10390.jpg" +"10391" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10391.jpg" +"10392" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10392.jpg" +"10393" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10393.jpg" +"10394" "Is there a leopard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10394.jpg" +"10395" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10395.jpg" +"10396" "Is there a antelope in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10396.jpg" +"10397" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10397.jpg" +"10398" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10398.jpg" +"10399" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10399.jpg" +"10400" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10400.jpg" +"10401" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10401.jpg" +"10402" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10402.jpg" +"10403" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10403.jpg" +"10404" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10404.jpg" +"10405" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10405.jpg" +"10406" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10406.jpg" +"10407" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10407.jpg" +"10408" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10408.jpg" +"10409" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10409.jpg" +"10410" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10410.jpg" +"10411" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10411.jpg" +"10412" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10412.jpg" +"10413" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10413.jpg" +"10414" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10414.jpg" +"10415" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10415.jpg" +"10416" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10416.jpg" +"10417" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10417.jpg" +"10418" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10418.jpg" +"10419" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10419.jpg" +"10420" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10420.jpg" +"10421" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10421.jpg" +"10422" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10422.jpg" +"10423" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10423.jpg" +"10424" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10424.jpg" +"10425" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10425.jpg" +"10426" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10426.jpg" +"10427" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10427.jpg" +"10428" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10428.jpg" +"10429" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10429.jpg" +"10430" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10430.jpg" +"10431" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10431.jpg" +"10432" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10432.jpg" +"10433" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10433.jpg" +"10434" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10434.jpg" +"10435" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10435.jpg" +"10436" "Is there a bath in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10436.jpg" +"10437" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10437.jpg" +"10438" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10438.jpg" +"10439" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10439.jpg" +"10440" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10440.jpg" +"10441" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10441.jpg" +"10442" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10442.jpg" +"10443" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10443.jpg" +"10444" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10444.jpg" +"10445" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10445.jpg" +"10446" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10446.jpg" +"10447" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10447.jpg" +"10448" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10448.jpg" +"10449" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10449.jpg" +"10450" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10450.jpg" +"10451" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10451.jpg" +"10452" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10452.jpg" +"10453" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10453.jpg" +"10454" "Is there a bath in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10454.jpg" +"10455" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10455.jpg" +"10456" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10456.jpg" +"10457" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10457.jpg" +"10458" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10458.jpg" +"10459" "Is there a drink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10459.jpg" +"10460" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10460.jpg" +"10461" "Is there a sunglasses in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10461.jpg" +"10462" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10462.jpg" +"10463" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10463.jpg" +"10464" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10464.jpg" +"10465" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10465.jpg" +"10466" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10466.jpg" +"10467" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10467.jpg" +"10468" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10468.jpg" +"10469" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10469.jpg" +"10470" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10470.jpg" +"10471" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10471.jpg" +"10472" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10472.jpg" +"10473" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10473.jpg" +"10474" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10474.jpg" +"10475" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10475.jpg" +"10476" "Is there a mousepad in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10476.jpg" +"10477" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10477.jpg" +"10478" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10478.jpg" +"10479" "Is there a cone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10479.jpg" +"10480" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10480.jpg" +"10481" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10481.jpg" +"10482" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10482.jpg" +"10483" "Is there a mousepad in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10483.jpg" +"10484" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10484.jpg" +"10485" "Is there a pillow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10485.jpg" +"10486" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10486.jpg" +"10487" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10487.jpg" +"10488" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10488.jpg" +"10489" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10489.jpg" +"10490" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10490.jpg" +"10491" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10491.jpg" +"10492" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10492.jpg" +"10493" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10493.jpg" +"10494" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10494.jpg" +"10495" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10495.jpg" +"10496" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10496.jpg" +"10497" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10497.jpg" +"10498" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10498.jpg" +"10499" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10499.jpg" +"10500" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10500.jpg" +"10501" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10501.jpg" +"10502" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10502.jpg" +"10503" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10503.jpg" +"10504" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10504.jpg" +"10505" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10505.jpg" +"10506" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10506.jpg" +"10507" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10507.jpg" +"10508" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10508.jpg" +"10509" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10509.jpg" +"10510" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10510.jpg" +"10511" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10511.jpg" +"10512" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10512.jpg" +"10513" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10513.jpg" +"10514" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10514.jpg" +"10515" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10515.jpg" +"10516" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10516.jpg" +"10517" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10517.jpg" +"10518" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10518.jpg" +"10519" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10519.jpg" +"10520" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10520.jpg" +"10521" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10521.jpg" +"10522" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10522.jpg" +"10523" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10523.jpg" +"10524" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10524.jpg" +"10525" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10525.jpg" +"10526" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10526.jpg" +"10527" "Is there a plane in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10527.jpg" +"10528" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10528.jpg" +"10529" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10529.jpg" +"10530" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10530.jpg" +"10531" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10531.jpg" +"10532" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10532.jpg" +"10533" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10533.jpg" +"10534" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10534.jpg" +"10535" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10535.jpg" +"10536" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10536.jpg" +"10537" "Is there a luggage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10537.jpg" +"10538" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10538.jpg" +"10539" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10539.jpg" +"10540" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10540.jpg" +"10541" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10541.jpg" +"10542" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10542.jpg" +"10543" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10543.jpg" +"10544" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10544.jpg" +"10545" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10545.jpg" +"10546" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10546.jpg" +"10547" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10547.jpg" +"10548" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10548.jpg" +"10549" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10549.jpg" +"10550" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10550.jpg" +"10551" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10551.jpg" +"10552" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10552.jpg" +"10553" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10553.jpg" +"10554" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10554.jpg" +"10555" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10555.jpg" +"10556" "Is there a pole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10556.jpg" +"10557" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10557.jpg" +"10558" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10558.jpg" +"10559" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10559.jpg" +"10560" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10560.jpg" +"10561" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10561.jpg" +"10562" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10562.jpg" +"10563" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10563.jpg" +"10564" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10564.jpg" +"10565" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10565.jpg" +"10566" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10566.jpg" +"10567" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10567.jpg" +"10568" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10568.jpg" +"10569" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10569.jpg" +"10570" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10570.jpg" +"10571" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10571.jpg" +"10572" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10572.jpg" +"10573" "Is there a slippers in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10573.jpg" +"10574" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10574.jpg" +"10575" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10575.jpg" +"10576" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10576.jpg" +"10577" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10577.jpg" +"10578" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10578.jpg" +"10579" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10579.jpg" +"10580" "Is there a dresser in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10580.jpg" +"10581" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10581.jpg" +"10582" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10582.jpg" +"10583" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10583.jpg" +"10584" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10584.jpg" +"10585" "Is there a doghole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10585.jpg" +"10586" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10586.jpg" +"10587" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10587.jpg" +"10588" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10588.jpg" +"10589" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10589.jpg" +"10590" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10590.jpg" +"10591" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10591.jpg" +"10592" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10592.jpg" +"10593" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10593.jpg" +"10594" "Is there a elephant in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10594.jpg" +"10595" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10595.jpg" +"10596" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10596.jpg" +"10597" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10597.jpg" +"10598" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10598.jpg" +"10599" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10599.jpg" +"10600" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10600.jpg" +"10601" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10601.jpg" +"10602" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10602.jpg" +"10603" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10603.jpg" +"10604" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10604.jpg" +"10605" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10605.jpg" +"10606" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10606.jpg" +"10607" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10607.jpg" +"10608" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10608.jpg" +"10609" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10609.jpg" +"10610" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10610.jpg" +"10611" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10611.jpg" +"10612" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10612.jpg" +"10613" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10613.jpg" +"10614" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10614.jpg" +"10615" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10615.jpg" +"10616" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10616.jpg" +"10617" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10617.jpg" +"10618" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10618.jpg" +"10619" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10619.jpg" +"10620" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10620.jpg" +"10621" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10621.jpg" +"10622" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10622.jpg" +"10623" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10623.jpg" +"10624" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10624.jpg" +"10625" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10625.jpg" +"10626" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10626.jpg" +"10627" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10627.jpg" +"10628" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10628.jpg" +"10629" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10629.jpg" +"10630" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10630.jpg" +"10631" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10631.jpg" +"10632" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10632.jpg" +"10633" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10633.jpg" +"10634" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10634.jpg" +"10635" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10635.jpg" +"10636" "Is there a banana in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10636.jpg" +"10637" "Is there a bread in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10637.jpg" +"10638" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10638.jpg" +"10639" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10639.jpg" +"10640" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10640.jpg" +"10641" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10641.jpg" +"10642" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10642.jpg" +"10643" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10643.jpg" +"10644" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10644.jpg" +"10645" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10645.jpg" +"10646" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10646.jpg" +"10647" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10647.jpg" +"10648" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10648.jpg" +"10649" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10649.jpg" +"10650" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10650.jpg" +"10651" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10651.jpg" +"10652" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10652.jpg" +"10653" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10653.jpg" +"10654" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10654.jpg" +"10655" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10655.jpg" +"10656" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10656.jpg" +"10657" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10657.jpg" +"10658" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10658.jpg" +"10659" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10659.jpg" +"10660" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10660.jpg" +"10661" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10661.jpg" +"10662" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10662.jpg" +"10663" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10663.jpg" +"10664" "Is there a pad in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10664.jpg" +"10665" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10665.jpg" +"10666" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10666.jpg" +"10667" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10667.jpg" +"10668" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10668.jpg" +"10669" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10669.jpg" +"10670" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10670.jpg" +"10671" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10671.jpg" +"10672" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10672.jpg" +"10673" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10673.jpg" +"10674" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10674.jpg" +"10675" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10675.jpg" +"10676" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10676.jpg" +"10677" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10677.jpg" +"10678" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10678.jpg" +"10679" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10679.jpg" +"10680" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10680.jpg" +"10681" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10681.jpg" +"10682" "Is there a rope in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10682.jpg" +"10683" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10683.jpg" +"10684" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10684.jpg" +"10685" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10685.jpg" +"10686" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10686.jpg" +"10687" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10687.jpg" +"10688" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10688.jpg" +"10689" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10689.jpg" +"10690" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10690.jpg" +"10691" "Is there a toilet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10691.jpg" +"10692" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10692.jpg" +"10693" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10693.jpg" +"10694" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10694.jpg" +"10695" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10695.jpg" +"10696" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10696.jpg" +"10697" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10697.jpg" +"10698" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10698.jpg" +"10699" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10699.jpg" +"10700" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10700.jpg" +"10701" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10701.jpg" +"10702" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10702.jpg" +"10703" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10703.jpg" +"10704" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10704.jpg" +"10705" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10705.jpg" +"10706" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10706.jpg" +"10707" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10707.jpg" +"10708" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10708.jpg" +"10709" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10709.jpg" +"10710" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10710.jpg" +"10711" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10711.jpg" +"10712" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10712.jpg" +"10713" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10713.jpg" +"10714" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10714.jpg" +"10715" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10715.jpg" +"10716" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10716.jpg" +"10717" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10717.jpg" +"10718" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10718.jpg" +"10719" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10719.jpg" +"10720" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10720.jpg" +"10721" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10721.jpg" +"10722" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10722.jpg" +"10723" "Is there a toilet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10723.jpg" +"10724" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10724.jpg" +"10725" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10725.jpg" +"10726" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10726.jpg" +"10727" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10727.jpg" +"10728" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10728.jpg" +"10729" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10729.jpg" +"10730" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10730.jpg" +"10731" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10731.jpg" +"10732" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10732.jpg" +"10733" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10733.jpg" +"10734" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10734.jpg" +"10735" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10735.jpg" +"10736" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10736.jpg" +"10737" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10737.jpg" +"10738" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10738.jpg" +"10739" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10739.jpg" +"10740" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10740.jpg" +"10741" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10741.jpg" +"10742" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10742.jpg" +"10743" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10743.jpg" +"10744" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10744.jpg" +"10745" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10745.jpg" +"10746" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10746.jpg" +"10747" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10747.jpg" +"10748" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10748.jpg" +"10749" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10749.jpg" +"10750" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10750.jpg" +"10751" "Is there a signal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10751.jpg" +"10752" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10752.jpg" +"10753" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10753.jpg" +"10754" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10754.jpg" +"10755" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10755.jpg" +"10756" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10756.jpg" +"10757" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10757.jpg" +"10758" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10758.jpg" +"10759" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10759.jpg" +"10760" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10760.jpg" +"10761" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10761.jpg" +"10762" "Is there a bed in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10762.jpg" +"10763" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10763.jpg" +"10764" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10764.jpg" +"10765" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10765.jpg" +"10766" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10766.jpg" +"10767" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10767.jpg" +"10768" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10768.jpg" +"10769" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10769.jpg" +"10770" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10770.jpg" +"10771" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10771.jpg" +"10772" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10772.jpg" +"10773" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10773.jpg" +"10774" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10774.jpg" +"10775" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10775.jpg" +"10776" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10776.jpg" +"10777" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10777.jpg" +"10778" "Is there a toothpick in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10778.jpg" +"10779" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10779.jpg" +"10780" "Is there a cushion in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10780.jpg" +"10781" "Is there a drink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10781.jpg" +"10782" "Is there a apple in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10782.jpg" +"10783" "Is there a carrot in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10783.jpg" +"10784" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10784.jpg" +"10785" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10785.jpg" +"10786" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10786.jpg" +"10787" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10787.jpg" +"10788" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10788.jpg" +"10789" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10789.jpg" +"10790" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10790.jpg" +"10791" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10791.jpg" +"10792" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10792.jpg" +"10793" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10793.jpg" +"10794" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10794.jpg" +"10795" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10795.jpg" +"10796" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10796.jpg" +"10797" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10797.jpg" +"10798" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10798.jpg" +"10799" "Is there a court in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10799.jpg" +"10800" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10800.jpg" +"10801" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10801.jpg" +"10802" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10802.jpg" +"10803" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10803.jpg" +"10804" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10804.jpg" +"10805" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10805.jpg" +"10806" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10806.jpg" +"10807" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10807.jpg" +"10808" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10808.jpg" +"10809" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10809.jpg" +"10810" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10810.jpg" +"10811" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10811.jpg" +"10812" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10812.jpg" +"10813" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10813.jpg" +"10814" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10814.jpg" +"10815" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10815.jpg" +"10816" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10816.jpg" +"10817" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10817.jpg" +"10818" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10818.jpg" +"10819" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10819.jpg" +"10820" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10820.jpg" +"10821" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10821.jpg" +"10822" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10822.jpg" +"10823" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10823.jpg" +"10824" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10824.jpg" +"10825" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10825.jpg" +"10826" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10826.jpg" +"10827" "Is there a rope in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10827.jpg" +"10828" "Is there a stage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10828.jpg" +"10829" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10829.jpg" +"10830" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10830.jpg" +"10831" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10831.jpg" +"10832" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10832.jpg" +"10833" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10833.jpg" +"10834" "Is there a rabbit in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10834.jpg" +"10835" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10835.jpg" +"10836" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10836.jpg" +"10837" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10837.jpg" +"10838" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10838.jpg" +"10839" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10839.jpg" +"10840" "Is there a truck in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10840.jpg" +"10841" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10841.jpg" +"10842" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10842.jpg" +"10843" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10843.jpg" +"10844" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10844.jpg" +"10845" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10845.jpg" +"10846" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10846.jpg" +"10847" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10847.jpg" +"10848" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10848.jpg" +"10849" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10849.jpg" +"10850" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10850.jpg" +"10851" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10851.jpg" +"10852" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10852.jpg" +"10853" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10853.jpg" +"10854" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10854.jpg" +"10855" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10855.jpg" +"10856" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10856.jpg" +"10857" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10857.jpg" +"10858" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10858.jpg" +"10859" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10859.jpg" +"10860" "Is there a bed in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10860.jpg" +"10861" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10861.jpg" +"10862" "Is there a court in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10862.jpg" +"10863" "Is there a goal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10863.jpg" +"10864" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10864.jpg" +"10865" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10865.jpg" +"10866" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10866.jpg" +"10867" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10867.jpg" +"10868" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10868.jpg" +"10869" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10869.jpg" +"10870" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10870.jpg" +"10871" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10871.jpg" +"10872" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10872.jpg" +"10873" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10873.jpg" +"10874" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10874.jpg" +"10875" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10875.jpg" +"10876" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10876.jpg" +"10877" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10877.jpg" +"10878" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10878.jpg" +"10879" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10879.jpg" +"10880" "Is there a saddle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10880.jpg" +"10881" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10881.jpg" +"10882" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10882.jpg" +"10883" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10883.jpg" +"10884" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10884.jpg" +"10885" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10885.jpg" +"10886" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10886.jpg" +"10887" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10887.jpg" +"10888" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10888.jpg" +"10889" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10889.jpg" +"10890" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10890.jpg" +"10891" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10891.jpg" +"10892" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10892.jpg" +"10893" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10893.jpg" +"10894" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10894.jpg" +"10895" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10895.jpg" +"10896" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10896.jpg" +"10897" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10897.jpg" +"10898" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10898.jpg" +"10899" "Is there a truck in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10899.jpg" +"10900" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10900.jpg" +"10901" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10901.jpg" +"10902" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10902.jpg" +"10903" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10903.jpg" +"10904" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10904.jpg" +"10905" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10905.jpg" +"10906" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10906.jpg" +"10907" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10907.jpg" +"10908" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10908.jpg" +"10909" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10909.jpg" +"10910" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10910.jpg" +"10911" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10911.jpg" +"10912" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10912.jpg" +"10913" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10913.jpg" +"10914" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10914.jpg" +"10915" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10915.jpg" +"10916" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10916.jpg" +"10917" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10917.jpg" +"10918" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10918.jpg" +"10919" "Is there a bag in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10919.jpg" +"10920" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10920.jpg" +"10921" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10921.jpg" +"10922" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10922.jpg" +"10923" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10923.jpg" +"10924" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10924.jpg" +"10925" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10925.jpg" +"10926" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10926.jpg" +"10927" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10927.jpg" +"10928" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10928.jpg" +"10929" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10929.jpg" +"10930" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10930.jpg" +"10931" "Is there a carpet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10931.jpg" +"10932" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10932.jpg" +"10933" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10933.jpg" +"10934" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10934.jpg" +"10935" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10935.jpg" +"10936" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10936.jpg" +"10937" "Is there a rabbit in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10937.jpg" +"10938" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10938.jpg" +"10939" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10939.jpg" +"10940" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10940.jpg" +"10941" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10941.jpg" +"10942" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10942.jpg" +"10943" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10943.jpg" +"10944" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10944.jpg" +"10945" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10945.jpg" +"10946" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10946.jpg" +"10947" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10947.jpg" +"10948" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10948.jpg" +"10949" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10949.jpg" +"10950" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10950.jpg" +"10951" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10951.jpg" +"10952" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10952.jpg" +"10953" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10953.jpg" +"10954" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10954.jpg" +"10955" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10955.jpg" +"10956" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10956.jpg" +"10957" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10957.jpg" +"10958" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10958.jpg" +"10959" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10959.jpg" +"10960" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10960.jpg" +"10961" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10961.jpg" +"10962" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10962.jpg" +"10963" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10963.jpg" +"10964" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10964.jpg" +"10965" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10965.jpg" +"10966" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10966.jpg" +"10967" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10967.jpg" +"10968" "Is there a elephant in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10968.jpg" +"10969" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10969.jpg" +"10970" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10970.jpg" +"10971" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10971.jpg" +"10972" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10972.jpg" +"10973" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10973.jpg" +"10974" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10974.jpg" +"10975" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10975.jpg" +"10976" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10976.jpg" +"10977" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10977.jpg" +"10978" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10978.jpg" +"10979" "Is there a chopsticks in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10979.jpg" +"10980" "Is there a scoon in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10980.jpg" +"10981" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10981.jpg" +"10982" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10982.jpg" +"10983" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10983.jpg" +"10984" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10984.jpg" +"10985" "Is there a luggage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10985.jpg" +"10986" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10986.jpg" +"10987" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10987.jpg" +"10988" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10988.jpg" +"10989" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10989.jpg" +"10990" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10990.jpg" +"10991" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10991.jpg" +"10992" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10992.jpg" +"10993" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10993.jpg" +"10994" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10994.jpg" +"10995" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10995.jpg" +"10996" "Is there a opener in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10996.jpg" +"10997" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10997.jpg" +"10998" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10998.jpg" +"10999" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/10999.jpg" +"11000" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11000.jpg" +"11001" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11001.jpg" +"11002" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11002.jpg" +"11003" "Is there a shell in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11003.jpg" +"11004" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11004.jpg" +"11005" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11005.jpg" +"11006" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11006.jpg" +"11007" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11007.jpg" +"11008" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11008.jpg" +"11009" "Is there a zebra in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11009.jpg" +"11010" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11010.jpg" +"11011" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11011.jpg" +"11012" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11012.jpg" +"11013" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11013.jpg" +"11014" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11014.jpg" +"11015" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11015.jpg" +"11016" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11016.jpg" +"11017" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11017.jpg" +"11018" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11018.jpg" +"11019" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11019.jpg" +"11020" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11020.jpg" +"11021" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11021.jpg" +"11022" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11022.jpg" +"11023" "Is there a buoy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11023.jpg" +"11024" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11024.jpg" +"11025" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11025.jpg" +"11026" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11026.jpg" +"11027" "Is there a bookshelf in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11027.jpg" +"11028" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11028.jpg" +"11029" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11029.jpg" +"11030" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11030.jpg" +"11031" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11031.jpg" +"11032" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11032.jpg" +"11033" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11033.jpg" +"11034" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11034.jpg" +"11035" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11035.jpg" +"11036" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11036.jpg" +"11037" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11037.jpg" +"11038" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11038.jpg" +"11039" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11039.jpg" +"11040" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11040.jpg" +"11041" "Is there a earphone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11041.jpg" +"11042" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11042.jpg" +"11043" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11043.jpg" +"11044" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11044.jpg" +"11045" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11045.jpg" +"11046" "Is there a electrombile in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11046.jpg" +"11047" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11047.jpg" +"11048" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11048.jpg" +"11049" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11049.jpg" +"11050" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11050.jpg" +"11051" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11051.jpg" +"11052" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11052.jpg" +"11053" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11053.jpg" +"11054" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11054.jpg" +"11055" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11055.jpg" +"11056" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11056.jpg" +"11057" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11057.jpg" +"11058" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11058.jpg" +"11059" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11059.jpg" +"11060" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11060.jpg" +"11061" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11061.jpg" +"11062" "Is there a dustbin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11062.jpg" +"11063" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11063.jpg" +"11064" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11064.jpg" +"11065" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11065.jpg" +"11066" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11066.jpg" +"11067" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11067.jpg" +"11068" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11068.jpg" +"11069" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11069.jpg" +"11070" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11070.jpg" +"11071" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11071.jpg" +"11072" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11072.jpg" +"11073" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11073.jpg" +"11074" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11074.jpg" +"11075" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11075.jpg" +"11076" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11076.jpg" +"11077" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11077.jpg" +"11078" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11078.jpg" +"11079" "Is there a ceiling in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11079.jpg" +"11080" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11080.jpg" +"11081" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11081.jpg" +"11082" "Is there a holder in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11082.jpg" +"11083" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11083.jpg" +"11084" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11084.jpg" +"11085" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11085.jpg" +"11086" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11086.jpg" +"11087" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11087.jpg" +"11088" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11088.jpg" +"11089" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11089.jpg" +"11090" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11090.jpg" +"11091" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11091.jpg" +"11092" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11092.jpg" +"11093" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11093.jpg" +"11094" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11094.jpg" +"11095" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11095.jpg" +"11096" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11096.jpg" +"11097" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11097.jpg" +"11098" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11098.jpg" +"11099" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11099.jpg" +"11100" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11100.jpg" +"11101" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11101.jpg" +"11102" "Is there a river in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11102.jpg" +"11103" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11103.jpg" +"11104" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11104.jpg" +"11105" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11105.jpg" +"11106" "Is there a snack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11106.jpg" +"11107" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11107.jpg" +"11108" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11108.jpg" +"11109" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11109.jpg" +"11110" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11110.jpg" +"11111" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11111.jpg" +"11112" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11112.jpg" +"11113" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11113.jpg" +"11114" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11114.jpg" +"11115" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11115.jpg" +"11116" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11116.jpg" +"11117" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11117.jpg" +"11118" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11118.jpg" +"11119" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11119.jpg" +"11120" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11120.jpg" +"11121" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11121.jpg" +"11122" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11122.jpg" +"11123" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11123.jpg" +"11124" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11124.jpg" +"11125" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11125.jpg" +"11126" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11126.jpg" +"11127" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11127.jpg" +"11128" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11128.jpg" +"11129" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11129.jpg" +"11130" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11130.jpg" +"11131" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11131.jpg" +"11132" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11132.jpg" +"11133" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11133.jpg" +"11134" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11134.jpg" +"11135" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11135.jpg" +"11136" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11136.jpg" +"11137" "Is there a coffee in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11137.jpg" +"11138" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11138.jpg" +"11139" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11139.jpg" +"11140" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11140.jpg" +"11141" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11141.jpg" +"11142" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11142.jpg" +"11143" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11143.jpg" +"11144" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11144.jpg" +"11145" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11145.jpg" +"11146" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11146.jpg" +"11147" "Is there a basin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11147.jpg" +"11148" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11148.jpg" +"11149" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11149.jpg" +"11150" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11150.jpg" +"11151" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11151.jpg" +"11152" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11152.jpg" +"11153" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11153.jpg" +"11154" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11154.jpg" +"11155" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11155.jpg" +"11156" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11156.jpg" +"11157" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11157.jpg" +"11158" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11158.jpg" +"11159" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11159.jpg" +"11160" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11160.jpg" +"11161" "Is there a waterfront in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11161.jpg" +"11162" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11162.jpg" +"11163" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11163.jpg" +"11164" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11164.jpg" +"11165" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11165.jpg" +"11166" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11166.jpg" +"11167" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11167.jpg" +"11168" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11168.jpg" +"11169" "Is there a bowl in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11169.jpg" +"11170" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11170.jpg" +"11171" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11171.jpg" +"11172" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11172.jpg" +"11173" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11173.jpg" +"11174" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11174.jpg" +"11175" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11175.jpg" +"11176" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11176.jpg" +"11177" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11177.jpg" +"11178" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11178.jpg" +"11179" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11179.jpg" +"11180" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11180.jpg" +"11181" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11181.jpg" +"11182" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11182.jpg" +"11183" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11183.jpg" +"11184" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11184.jpg" +"11185" "Is there a bus in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11185.jpg" +"11186" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11186.jpg" +"11187" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11187.jpg" +"11188" "Is there a tennis in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11188.jpg" +"11189" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11189.jpg" +"11190" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11190.jpg" +"11191" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11191.jpg" +"11192" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11192.jpg" +"11193" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11193.jpg" +"11194" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11194.jpg" +"11195" "Is there a wire in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11195.jpg" +"11196" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11196.jpg" +"11197" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11197.jpg" +"11198" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11198.jpg" +"11199" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11199.jpg" +"11200" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11200.jpg" +"11201" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11201.jpg" +"11202" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11202.jpg" +"11203" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11203.jpg" +"11204" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11204.jpg" +"11205" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11205.jpg" +"11206" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11206.jpg" +"11207" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11207.jpg" +"11208" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11208.jpg" +"11209" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11209.jpg" +"11210" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11210.jpg" +"11211" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11211.jpg" +"11212" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11212.jpg" +"11213" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11213.jpg" +"11214" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11214.jpg" +"11215" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11215.jpg" +"11216" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11216.jpg" +"11217" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11217.jpg" +"11218" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11218.jpg" +"11219" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11219.jpg" +"11220" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11220.jpg" +"11221" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11221.jpg" +"11222" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11222.jpg" +"11223" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11223.jpg" +"11224" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11224.jpg" +"11225" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11225.jpg" +"11226" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11226.jpg" +"11227" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11227.jpg" +"11228" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11228.jpg" +"11229" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11229.jpg" +"11230" "Is there a dustbin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11230.jpg" +"11231" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11231.jpg" +"11232" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11232.jpg" +"11233" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11233.jpg" +"11234" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11234.jpg" +"11235" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11235.jpg" +"11236" "Is there a insect in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11236.jpg" +"11237" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11237.jpg" +"11238" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11238.jpg" +"11239" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11239.jpg" +"11240" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11240.jpg" +"11241" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11241.jpg" +"11242" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11242.jpg" +"11243" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11243.jpg" +"11244" "Is there a hat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11244.jpg" +"11245" "Is there a dustbin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11245.jpg" +"11246" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11246.jpg" +"11247" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11247.jpg" +"11248" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11248.jpg" +"11249" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11249.jpg" +"11250" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11250.jpg" +"11251" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11251.jpg" +"11252" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11252.jpg" +"11253" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11253.jpg" +"11254" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11254.jpg" +"11255" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11255.jpg" +"11256" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11256.jpg" +"11257" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11257.jpg" +"11258" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11258.jpg" +"11259" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11259.jpg" +"11260" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11260.jpg" +"11261" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11261.jpg" +"11262" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11262.jpg" +"11263" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11263.jpg" +"11264" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11264.jpg" +"11265" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11265.jpg" +"11266" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11266.jpg" +"11267" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11267.jpg" +"11268" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11268.jpg" +"11269" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11269.jpg" +"11270" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11270.jpg" +"11271" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11271.jpg" +"11272" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11272.jpg" +"11273" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11273.jpg" +"11274" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11274.jpg" +"11275" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11275.jpg" +"11276" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11276.jpg" +"11277" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11277.jpg" +"11278" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11278.jpg" +"11279" "Is there a duck in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11279.jpg" +"11280" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11280.jpg" +"11281" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11281.jpg" +"11282" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11282.jpg" +"11283" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11283.jpg" +"11284" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11284.jpg" +"11285" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11285.jpg" +"11286" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11286.jpg" +"11287" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11287.jpg" +"11288" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11288.jpg" +"11289" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11289.jpg" +"11290" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11290.jpg" +"11291" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11291.jpg" +"11292" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11292.jpg" +"11293" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11293.jpg" +"11294" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11294.jpg" +"11295" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11295.jpg" +"11296" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11296.jpg" +"11297" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11297.jpg" +"11298" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11298.jpg" +"11299" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11299.jpg" +"11300" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11300.jpg" +"11301" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11301.jpg" +"11302" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11302.jpg" +"11303" "Is there a zebra in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11303.jpg" +"11304" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11304.jpg" +"11305" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11305.jpg" +"11306" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11306.jpg" +"11307" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11307.jpg" +"11308" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11308.jpg" +"11309" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11309.jpg" +"11310" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11310.jpg" +"11311" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11311.jpg" +"11312" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11312.jpg" +"11313" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11313.jpg" +"11314" "Is there a snowboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11314.jpg" +"11315" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11315.jpg" +"11316" "Is there a apple in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11316.jpg" +"11317" "Is there a tangerine in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11317.jpg" +"11318" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11318.jpg" +"11319" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11319.jpg" +"11320" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11320.jpg" +"11321" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11321.jpg" +"11322" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11322.jpg" +"11323" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11323.jpg" +"11324" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11324.jpg" +"11325" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11325.jpg" +"11326" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11326.jpg" +"11327" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11327.jpg" +"11328" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11328.jpg" +"11329" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11329.jpg" +"11330" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11330.jpg" +"11331" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11331.jpg" +"11332" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11332.jpg" +"11333" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11333.jpg" +"11334" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11334.jpg" +"11335" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11335.jpg" +"11336" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11336.jpg" +"11337" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11337.jpg" +"11338" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11338.jpg" +"11339" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11339.jpg" +"11340" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11340.jpg" +"11341" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11341.jpg" +"11342" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11342.jpg" +"11343" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11343.jpg" +"11344" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11344.jpg" +"11345" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11345.jpg" +"11346" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11346.jpg" +"11347" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11347.jpg" +"11348" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11348.jpg" +"11349" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11349.jpg" +"11350" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11350.jpg" +"11351" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11351.jpg" +"11352" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11352.jpg" +"11353" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11353.jpg" +"11354" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11354.jpg" +"11355" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11355.jpg" +"11356" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11356.jpg" +"11357" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11357.jpg" +"11358" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11358.jpg" +"11359" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11359.jpg" +"11360" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11360.jpg" +"11361" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11361.jpg" +"11362" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11362.jpg" +"11363" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11363.jpg" +"11364" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11364.jpg" +"11365" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11365.jpg" +"11366" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11366.jpg" +"11367" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11367.jpg" +"11368" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11368.jpg" +"11369" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11369.jpg" +"11370" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11370.jpg" +"11371" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11371.jpg" +"11372" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11372.jpg" +"11373" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11373.jpg" +"11374" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11374.jpg" +"11375" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11375.jpg" +"11376" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11376.jpg" +"11377" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11377.jpg" +"11378" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11378.jpg" +"11379" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11379.jpg" +"11380" "Is there a doghole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11380.jpg" +"11381" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11381.jpg" +"11382" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11382.jpg" +"11383" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11383.jpg" +"11384" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11384.jpg" +"11385" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11385.jpg" +"11386" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11386.jpg" +"11387" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11387.jpg" +"11388" "Is there a cooker in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11388.jpg" +"11389" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11389.jpg" +"11390" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11390.jpg" +"11391" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11391.jpg" +"11392" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11392.jpg" +"11393" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11393.jpg" +"11394" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11394.jpg" +"11395" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11395.jpg" +"11396" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11396.jpg" +"11397" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11397.jpg" +"11398" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11398.jpg" +"11399" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11399.jpg" +"11400" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11400.jpg" +"11401" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11401.jpg" +"11402" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11402.jpg" +"11403" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11403.jpg" +"11404" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11404.jpg" +"11405" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11405.jpg" +"11406" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11406.jpg" +"11407" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11407.jpg" +"11408" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11408.jpg" +"11409" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11409.jpg" +"11410" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11410.jpg" +"11411" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11411.jpg" +"11412" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11412.jpg" +"11413" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11413.jpg" +"11414" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11414.jpg" +"11415" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11415.jpg" +"11416" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11416.jpg" +"11417" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11417.jpg" +"11418" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11418.jpg" +"11419" "Is there a zebra in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11419.jpg" +"11420" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11420.jpg" +"11421" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11421.jpg" +"11422" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11422.jpg" +"11423" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11423.jpg" +"11424" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11424.jpg" +"11425" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11425.jpg" +"11426" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11426.jpg" +"11427" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11427.jpg" +"11428" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11428.jpg" +"11429" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11429.jpg" +"11430" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11430.jpg" +"11431" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11431.jpg" +"11432" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11432.jpg" +"11433" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11433.jpg" +"11434" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11434.jpg" +"11435" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11435.jpg" +"11436" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11436.jpg" +"11437" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11437.jpg" +"11438" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11438.jpg" +"11439" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11439.jpg" +"11440" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11440.jpg" +"11441" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11441.jpg" +"11442" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11442.jpg" +"11443" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11443.jpg" +"11444" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11444.jpg" +"11445" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11445.jpg" +"11446" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11446.jpg" +"11447" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11447.jpg" +"11448" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11448.jpg" +"11449" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11449.jpg" +"11450" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11450.jpg" +"11451" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11451.jpg" +"11452" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11452.jpg" +"11453" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11453.jpg" +"11454" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11454.jpg" +"11455" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11455.jpg" +"11456" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11456.jpg" +"11457" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11457.jpg" +"11458" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11458.jpg" +"11459" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11459.jpg" +"11460" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11460.jpg" +"11461" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11461.jpg" +"11462" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11462.jpg" +"11463" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11463.jpg" +"11464" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11464.jpg" +"11465" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11465.jpg" +"11466" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11466.jpg" +"11467" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11467.jpg" +"11468" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11468.jpg" +"11469" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11469.jpg" +"11470" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11470.jpg" +"11471" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11471.jpg" +"11472" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11472.jpg" +"11473" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11473.jpg" +"11474" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11474.jpg" +"11475" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11475.jpg" +"11476" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11476.jpg" +"11477" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11477.jpg" +"11478" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11478.jpg" +"11479" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11479.jpg" +"11480" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11480.jpg" +"11481" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11481.jpg" +"11482" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11482.jpg" +"11483" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11483.jpg" +"11484" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11484.jpg" +"11485" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11485.jpg" +"11486" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11486.jpg" +"11487" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11487.jpg" +"11488" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11488.jpg" +"11489" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11489.jpg" +"11490" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11490.jpg" +"11491" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11491.jpg" +"11492" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11492.jpg" +"11493" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11493.jpg" +"11494" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11494.jpg" +"11495" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11495.jpg" +"11496" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11496.jpg" +"11497" "Is there a monkey in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11497.jpg" +"11498" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11498.jpg" +"11499" "Is there a pot in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11499.jpg" +"11500" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11500.jpg" +"11501" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11501.jpg" +"11502" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11502.jpg" +"11503" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11503.jpg" +"11504" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11504.jpg" +"11505" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11505.jpg" +"11506" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11506.jpg" +"11507" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11507.jpg" +"11508" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11508.jpg" +"11509" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11509.jpg" +"11510" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11510.jpg" +"11511" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11511.jpg" +"11512" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11512.jpg" +"11513" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11513.jpg" +"11514" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11514.jpg" +"11515" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11515.jpg" +"11516" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11516.jpg" +"11517" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11517.jpg" +"11518" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11518.jpg" +"11519" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11519.jpg" +"11520" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11520.jpg" +"11521" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11521.jpg" +"11522" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11522.jpg" +"11523" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11523.jpg" +"11524" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11524.jpg" +"11525" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11525.jpg" +"11526" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11526.jpg" +"11527" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11527.jpg" +"11528" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11528.jpg" +"11529" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11529.jpg" +"11530" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11530.jpg" +"11531" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11531.jpg" +"11532" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11532.jpg" +"11533" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11533.jpg" +"11534" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11534.jpg" +"11535" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11535.jpg" +"11536" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11536.jpg" +"11537" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11537.jpg" +"11538" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11538.jpg" +"11539" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11539.jpg" +"11540" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11540.jpg" +"11541" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11541.jpg" +"11542" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11542.jpg" +"11543" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11543.jpg" +"11544" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11544.jpg" +"11545" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11545.jpg" +"11546" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11546.jpg" +"11547" "Is there a lamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11547.jpg" +"11548" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11548.jpg" +"11549" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11549.jpg" +"11550" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11550.jpg" +"11551" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11551.jpg" +"11552" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11552.jpg" +"11553" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11553.jpg" +"11554" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11554.jpg" +"11555" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11555.jpg" +"11556" "Is there a sled in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11556.jpg" +"11557" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11557.jpg" +"11558" "Is there a shampoo in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11558.jpg" +"11559" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11559.jpg" +"11560" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11560.jpg" +"11561" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11561.jpg" +"11562" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11562.jpg" +"11563" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11563.jpg" +"11564" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11564.jpg" +"11565" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11565.jpg" +"11566" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11566.jpg" +"11567" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11567.jpg" +"11568" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11568.jpg" +"11569" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11569.jpg" +"11570" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11570.jpg" +"11571" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11571.jpg" +"11572" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11572.jpg" +"11573" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11573.jpg" +"11574" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11574.jpg" +"11575" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11575.jpg" +"11576" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11576.jpg" +"11577" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11577.jpg" +"11578" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11578.jpg" +"11579" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11579.jpg" +"11580" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11580.jpg" +"11581" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11581.jpg" +"11582" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11582.jpg" +"11583" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11583.jpg" +"11584" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11584.jpg" +"11585" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11585.jpg" +"11586" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11586.jpg" +"11587" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11587.jpg" +"11588" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11588.jpg" +"11589" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11589.jpg" +"11590" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11590.jpg" +"11591" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11591.jpg" +"11592" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11592.jpg" +"11593" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11593.jpg" +"11594" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11594.jpg" +"11595" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11595.jpg" +"11596" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11596.jpg" +"11597" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11597.jpg" +"11598" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11598.jpg" +"11599" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11599.jpg" +"11600" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11600.jpg" +"11601" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11601.jpg" +"11602" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11602.jpg" +"11603" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11603.jpg" +"11604" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11604.jpg" +"11605" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11605.jpg" +"11606" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11606.jpg" +"11607" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11607.jpg" +"11608" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11608.jpg" +"11609" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11609.jpg" +"11610" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11610.jpg" +"11611" "Is there a tangerine in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11611.jpg" +"11612" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11612.jpg" +"11613" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11613.jpg" +"11614" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11614.jpg" +"11615" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11615.jpg" +"11616" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11616.jpg" +"11617" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11617.jpg" +"11618" "Is there a pinwheel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11618.jpg" +"11619" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11619.jpg" +"11620" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11620.jpg" +"11621" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11621.jpg" +"11622" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11622.jpg" +"11623" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11623.jpg" +"11624" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11624.jpg" +"11625" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11625.jpg" +"11626" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11626.jpg" +"11627" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11627.jpg" +"11628" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11628.jpg" +"11629" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11629.jpg" +"11630" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11630.jpg" +"11631" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11631.jpg" +"11632" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11632.jpg" +"11633" "Is there a bus in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11633.jpg" +"11634" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11634.jpg" +"11635" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11635.jpg" +"11636" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11636.jpg" +"11637" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11637.jpg" +"11638" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11638.jpg" +"11639" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11639.jpg" +"11640" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11640.jpg" +"11641" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11641.jpg" +"11642" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11642.jpg" +"11643" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11643.jpg" +"11644" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11644.jpg" +"11645" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11645.jpg" +"11646" "Is there a keyboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11646.jpg" +"11647" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11647.jpg" +"11648" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11648.jpg" +"11649" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11649.jpg" +"11650" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11650.jpg" +"11651" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11651.jpg" +"11652" "Is there a sanitizer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11652.jpg" +"11653" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11653.jpg" +"11654" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11654.jpg" +"11655" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11655.jpg" +"11656" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11656.jpg" +"11657" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11657.jpg" +"11658" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11658.jpg" +"11659" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11659.jpg" +"11660" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11660.jpg" +"11661" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11661.jpg" +"11662" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11662.jpg" +"11663" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11663.jpg" +"11664" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11664.jpg" +"11665" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11665.jpg" +"11666" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11666.jpg" +"11667" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11667.jpg" +"11668" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11668.jpg" +"11669" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11669.jpg" +"11670" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11670.jpg" +"11671" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11671.jpg" +"11672" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11672.jpg" +"11673" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11673.jpg" +"11674" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11674.jpg" +"11675" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11675.jpg" +"11676" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11676.jpg" +"11677" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11677.jpg" +"11678" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11678.jpg" +"11679" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11679.jpg" +"11680" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11680.jpg" +"11681" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11681.jpg" +"11682" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11682.jpg" +"11683" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11683.jpg" +"11684" "Is there a bridge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11684.jpg" +"11685" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11685.jpg" +"11686" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11686.jpg" +"11687" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11687.jpg" +"11688" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11688.jpg" +"11689" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11689.jpg" +"11690" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11690.jpg" +"11691" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11691.jpg" +"11692" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11692.jpg" +"11693" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11693.jpg" +"11694" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11694.jpg" +"11695" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11695.jpg" +"11696" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11696.jpg" +"11697" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11697.jpg" +"11698" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11698.jpg" +"11699" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11699.jpg" +"11700" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11700.jpg" +"11701" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11701.jpg" +"11702" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11702.jpg" +"11703" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11703.jpg" +"11704" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11704.jpg" +"11705" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11705.jpg" +"11706" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11706.jpg" +"11707" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11707.jpg" +"11708" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11708.jpg" +"11709" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11709.jpg" +"11710" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11710.jpg" +"11711" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11711.jpg" +"11712" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11712.jpg" +"11713" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11713.jpg" +"11714" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11714.jpg" +"11715" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11715.jpg" +"11716" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11716.jpg" +"11717" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11717.jpg" +"11718" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11718.jpg" +"11719" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11719.jpg" +"11720" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11720.jpg" +"11721" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11721.jpg" +"11722" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11722.jpg" +"11723" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11723.jpg" +"11724" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11724.jpg" +"11725" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11725.jpg" +"11726" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11726.jpg" +"11727" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11727.jpg" +"11728" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11728.jpg" +"11729" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11729.jpg" +"11730" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11730.jpg" +"11731" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11731.jpg" +"11732" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11732.jpg" +"11733" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11733.jpg" +"11734" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11734.jpg" +"11735" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11735.jpg" +"11736" "Is there a monitor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11736.jpg" +"11737" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11737.jpg" +"11738" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11738.jpg" +"11739" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11739.jpg" +"11740" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11740.jpg" +"11741" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11741.jpg" +"11742" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11742.jpg" +"11743" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11743.jpg" +"11744" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11744.jpg" +"11745" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11745.jpg" +"11746" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11746.jpg" +"11747" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11747.jpg" +"11748" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11748.jpg" +"11749" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11749.jpg" +"11750" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11750.jpg" +"11751" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11751.jpg" +"11752" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11752.jpg" +"11753" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11753.jpg" +"11754" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11754.jpg" +"11755" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11755.jpg" +"11756" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11756.jpg" +"11757" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11757.jpg" +"11758" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11758.jpg" +"11759" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11759.jpg" +"11760" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11760.jpg" +"11761" "Is there a bowl in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11761.jpg" +"11762" "Is there a chopsticks in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11762.jpg" +"11763" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11763.jpg" +"11764" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11764.jpg" +"11765" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11765.jpg" +"11766" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11766.jpg" +"11767" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11767.jpg" +"11768" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11768.jpg" +"11769" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11769.jpg" +"11770" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11770.jpg" +"11771" "Is there a doghole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11771.jpg" +"11772" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11772.jpg" +"11773" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11773.jpg" +"11774" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11774.jpg" +"11775" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11775.jpg" +"11776" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11776.jpg" +"11777" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11777.jpg" +"11778" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11778.jpg" +"11779" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11779.jpg" +"11780" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11780.jpg" +"11781" "Is there a luggage in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11781.jpg" +"11782" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11782.jpg" +"11783" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11783.jpg" +"11784" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11784.jpg" +"11785" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11785.jpg" +"11786" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11786.jpg" +"11787" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11787.jpg" +"11788" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11788.jpg" +"11789" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11789.jpg" +"11790" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11790.jpg" +"11791" "Is there a train in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11791.jpg" +"11792" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11792.jpg" +"11793" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11793.jpg" +"11794" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11794.jpg" +"11795" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11795.jpg" +"11796" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11796.jpg" +"11797" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11797.jpg" +"11798" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11798.jpg" +"11799" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11799.jpg" +"11800" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11800.jpg" +"11801" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11801.jpg" +"11802" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11802.jpg" +"11803" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11803.jpg" +"11804" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11804.jpg" +"11805" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11805.jpg" +"11806" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11806.jpg" +"11807" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11807.jpg" +"11808" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11808.jpg" +"11809" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11809.jpg" +"11810" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11810.jpg" +"11811" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11811.jpg" +"11812" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11812.jpg" +"11813" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11813.jpg" +"11814" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11814.jpg" +"11815" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11815.jpg" +"11816" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11816.jpg" +"11817" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11817.jpg" +"11818" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11818.jpg" +"11819" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11819.jpg" +"11820" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11820.jpg" +"11821" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11821.jpg" +"11822" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11822.jpg" +"11823" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11823.jpg" +"11824" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11824.jpg" +"11825" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11825.jpg" +"11826" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11826.jpg" +"11827" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11827.jpg" +"11828" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11828.jpg" +"11829" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11829.jpg" +"11830" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11830.jpg" +"11831" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11831.jpg" +"11832" "Is there a plane in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11832.jpg" +"11833" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11833.jpg" +"11834" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11834.jpg" +"11835" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11835.jpg" +"11836" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11836.jpg" +"11837" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11837.jpg" +"11838" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11838.jpg" +"11839" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11839.jpg" +"11840" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11840.jpg" +"11841" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11841.jpg" +"11842" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11842.jpg" +"11843" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11843.jpg" +"11844" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11844.jpg" +"11845" "Is there a doghole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11845.jpg" +"11846" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11846.jpg" +"11847" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11847.jpg" +"11848" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11848.jpg" +"11849" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11849.jpg" +"11850" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11850.jpg" +"11851" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11851.jpg" +"11852" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11852.jpg" +"11853" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11853.jpg" +"11854" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11854.jpg" +"11855" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11855.jpg" +"11856" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11856.jpg" +"11857" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11857.jpg" +"11858" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11858.jpg" +"11859" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11859.jpg" +"11860" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11860.jpg" +"11861" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11861.jpg" +"11862" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11862.jpg" +"11863" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11863.jpg" +"11864" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11864.jpg" +"11865" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11865.jpg" +"11866" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11866.jpg" +"11867" "Is there a reef in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11867.jpg" +"11868" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11868.jpg" +"11869" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11869.jpg" +"11870" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11870.jpg" +"11871" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11871.jpg" +"11872" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11872.jpg" +"11873" "Is there a building in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11873.jpg" +"11874" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11874.jpg" +"11875" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11875.jpg" +"11876" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11876.jpg" +"11877" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11877.jpg" +"11878" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11878.jpg" +"11879" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11879.jpg" +"11880" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11880.jpg" +"11881" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11881.jpg" +"11882" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11882.jpg" +"11883" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11883.jpg" +"11884" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11884.jpg" +"11885" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11885.jpg" +"11886" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11886.jpg" +"11887" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11887.jpg" +"11888" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11888.jpg" +"11889" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11889.jpg" +"11890" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11890.jpg" +"11891" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11891.jpg" +"11892" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11892.jpg" +"11893" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11893.jpg" +"11894" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11894.jpg" +"11895" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11895.jpg" +"11896" "Is there a juicer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11896.jpg" +"11897" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11897.jpg" +"11898" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11898.jpg" +"11899" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11899.jpg" +"11900" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11900.jpg" +"11901" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11901.jpg" +"11902" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11902.jpg" +"11903" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11903.jpg" +"11904" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11904.jpg" +"11905" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11905.jpg" +"11906" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11906.jpg" +"11907" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11907.jpg" +"11908" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11908.jpg" +"11909" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11909.jpg" +"11910" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11910.jpg" +"11911" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11911.jpg" +"11912" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11912.jpg" +"11913" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11913.jpg" +"11914" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11914.jpg" +"11915" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11915.jpg" +"11916" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11916.jpg" +"11917" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11917.jpg" +"11918" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11918.jpg" +"11919" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11919.jpg" +"11920" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11920.jpg" +"11921" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11921.jpg" +"11922" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11922.jpg" +"11923" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11923.jpg" +"11924" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11924.jpg" +"11925" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11925.jpg" +"11926" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11926.jpg" +"11927" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11927.jpg" +"11928" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11928.jpg" +"11929" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11929.jpg" +"11930" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11930.jpg" +"11931" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11931.jpg" +"11932" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11932.jpg" +"11933" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11933.jpg" +"11934" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11934.jpg" +"11935" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11935.jpg" +"11936" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11936.jpg" +"11937" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11937.jpg" +"11938" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11938.jpg" +"11939" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11939.jpg" +"11940" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11940.jpg" +"11941" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11941.jpg" +"11942" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11942.jpg" +"11943" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11943.jpg" +"11944" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11944.jpg" +"11945" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11945.jpg" +"11946" "Is there a shampoo in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11946.jpg" +"11947" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11947.jpg" +"11948" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11948.jpg" +"11949" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11949.jpg" +"11950" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11950.jpg" +"11951" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11951.jpg" +"11952" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11952.jpg" +"11953" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11953.jpg" +"11954" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11954.jpg" +"11955" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11955.jpg" +"11956" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11956.jpg" +"11957" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11957.jpg" +"11958" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11958.jpg" +"11959" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11959.jpg" +"11960" "Is there a bath in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11960.jpg" +"11961" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11961.jpg" +"11962" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11962.jpg" +"11963" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11963.jpg" +"11964" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11964.jpg" +"11965" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11965.jpg" +"11966" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11966.jpg" +"11967" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11967.jpg" +"11968" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11968.jpg" +"11969" "Is there a milk in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11969.jpg" +"11970" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11970.jpg" +"11971" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11971.jpg" +"11972" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11972.jpg" +"11973" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11973.jpg" +"11974" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11974.jpg" +"11975" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11975.jpg" +"11976" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11976.jpg" +"11977" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11977.jpg" +"11978" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11978.jpg" +"11979" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11979.jpg" +"11980" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11980.jpg" +"11981" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11981.jpg" +"11982" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11982.jpg" +"11983" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11983.jpg" +"11984" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11984.jpg" +"11985" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11985.jpg" +"11986" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11986.jpg" +"11987" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11987.jpg" +"11988" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11988.jpg" +"11989" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11989.jpg" +"11990" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11990.jpg" +"11991" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11991.jpg" +"11992" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11992.jpg" +"11993" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11993.jpg" +"11994" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11994.jpg" +"11995" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11995.jpg" +"11996" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11996.jpg" +"11997" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11997.jpg" +"11998" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11998.jpg" +"11999" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/11999.jpg" +"12000" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12000.jpg" +"12001" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12001.jpg" +"12002" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12002.jpg" +"12003" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12003.jpg" +"12004" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12004.jpg" +"12005" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12005.jpg" +"12006" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12006.jpg" +"12007" "Is there a wire in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12007.jpg" +"12008" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12008.jpg" +"12009" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12009.jpg" +"12010" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12010.jpg" +"12011" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12011.jpg" +"12012" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12012.jpg" +"12013" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12013.jpg" +"12014" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12014.jpg" +"12015" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12015.jpg" +"12016" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12016.jpg" +"12017" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12017.jpg" +"12018" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12018.jpg" +"12019" "Is there a monitor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12019.jpg" +"12020" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12020.jpg" +"12021" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12021.jpg" +"12022" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12022.jpg" +"12023" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12023.jpg" +"12024" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12024.jpg" +"12025" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12025.jpg" +"12026" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12026.jpg" +"12027" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12027.jpg" +"12028" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12028.jpg" +"12029" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12029.jpg" +"12030" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12030.jpg" +"12031" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12031.jpg" +"12032" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12032.jpg" +"12033" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12033.jpg" +"12034" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12034.jpg" +"12035" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12035.jpg" +"12036" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12036.jpg" +"12037" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12037.jpg" +"12038" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12038.jpg" +"12039" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12039.jpg" +"12040" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12040.jpg" +"12041" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12041.jpg" +"12042" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12042.jpg" +"12043" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12043.jpg" +"12044" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12044.jpg" +"12045" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12045.jpg" +"12046" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12046.jpg" +"12047" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12047.jpg" +"12048" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12048.jpg" +"12049" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12049.jpg" +"12050" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12050.jpg" +"12051" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12051.jpg" +"12052" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12052.jpg" +"12053" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12053.jpg" +"12054" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12054.jpg" +"12055" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12055.jpg" +"12056" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12056.jpg" +"12057" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12057.jpg" +"12058" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12058.jpg" +"12059" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12059.jpg" +"12060" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12060.jpg" +"12061" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12061.jpg" +"12062" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12062.jpg" +"12063" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12063.jpg" +"12064" "Is there a mirror in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12064.jpg" +"12065" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12065.jpg" +"12066" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12066.jpg" +"12067" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12067.jpg" +"12068" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12068.jpg" +"12069" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12069.jpg" +"12070" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12070.jpg" +"12071" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12071.jpg" +"12072" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12072.jpg" +"12073" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12073.jpg" +"12074" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12074.jpg" +"12075" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12075.jpg" +"12076" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12076.jpg" +"12077" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12077.jpg" +"12078" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12078.jpg" +"12079" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12079.jpg" +"12080" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12080.jpg" +"12081" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12081.jpg" +"12082" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12082.jpg" +"12083" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12083.jpg" +"12084" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12084.jpg" +"12085" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12085.jpg" +"12086" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12086.jpg" +"12087" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12087.jpg" +"12088" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12088.jpg" +"12089" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12089.jpg" +"12090" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12090.jpg" +"12091" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12091.jpg" +"12092" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12092.jpg" +"12093" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12093.jpg" +"12094" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12094.jpg" +"12095" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12095.jpg" +"12096" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12096.jpg" +"12097" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12097.jpg" +"12098" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12098.jpg" +"12099" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12099.jpg" +"12100" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12100.jpg" +"12101" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12101.jpg" +"12102" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12102.jpg" +"12103" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12103.jpg" +"12104" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12104.jpg" +"12105" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12105.jpg" +"12106" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12106.jpg" +"12107" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12107.jpg" +"12108" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12108.jpg" +"12109" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12109.jpg" +"12110" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12110.jpg" +"12111" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12111.jpg" +"12112" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12112.jpg" +"12113" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12113.jpg" +"12114" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12114.jpg" +"12115" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12115.jpg" +"12116" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12116.jpg" +"12117" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12117.jpg" +"12118" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12118.jpg" +"12119" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12119.jpg" +"12120" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12120.jpg" +"12121" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12121.jpg" +"12122" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12122.jpg" +"12123" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12123.jpg" +"12124" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12124.jpg" +"12125" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12125.jpg" +"12126" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12126.jpg" +"12127" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12127.jpg" +"12128" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12128.jpg" +"12129" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12129.jpg" +"12130" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12130.jpg" +"12131" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12131.jpg" +"12132" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12132.jpg" +"12133" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12133.jpg" +"12134" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12134.jpg" +"12135" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12135.jpg" +"12136" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12136.jpg" +"12137" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12137.jpg" +"12138" "Is there a net in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12138.jpg" +"12139" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12139.jpg" +"12140" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12140.jpg" +"12141" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12141.jpg" +"12142" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12142.jpg" +"12143" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12143.jpg" +"12144" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12144.jpg" +"12145" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12145.jpg" +"12146" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12146.jpg" +"12147" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12147.jpg" +"12148" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12148.jpg" +"12149" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12149.jpg" +"12150" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12150.jpg" +"12151" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12151.jpg" +"12152" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12152.jpg" +"12153" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12153.jpg" +"12154" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12154.jpg" +"12155" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12155.jpg" +"12156" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12156.jpg" +"12157" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12157.jpg" +"12158" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12158.jpg" +"12159" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12159.jpg" +"12160" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12160.jpg" +"12161" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12161.jpg" +"12162" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12162.jpg" +"12163" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12163.jpg" +"12164" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12164.jpg" +"12165" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12165.jpg" +"12166" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12166.jpg" +"12167" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12167.jpg" +"12168" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12168.jpg" +"12169" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12169.jpg" +"12170" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12170.jpg" +"12171" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12171.jpg" +"12172" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12172.jpg" +"12173" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12173.jpg" +"12174" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12174.jpg" +"12175" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12175.jpg" +"12176" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12176.jpg" +"12177" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12177.jpg" +"12178" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12178.jpg" +"12179" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12179.jpg" +"12180" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12180.jpg" +"12181" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12181.jpg" +"12182" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12182.jpg" +"12183" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12183.jpg" +"12184" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12184.jpg" +"12185" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12185.jpg" +"12186" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12186.jpg" +"12187" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12187.jpg" +"12188" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12188.jpg" +"12189" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12189.jpg" +"12190" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12190.jpg" +"12191" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12191.jpg" +"12192" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12192.jpg" +"12193" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12193.jpg" +"12194" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12194.jpg" +"12195" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12195.jpg" +"12196" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12196.jpg" +"12197" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12197.jpg" +"12198" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12198.jpg" +"12199" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12199.jpg" +"12200" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12200.jpg" +"12201" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12201.jpg" +"12202" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12202.jpg" +"12203" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12203.jpg" +"12204" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12204.jpg" +"12205" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12205.jpg" +"12206" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12206.jpg" +"12207" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12207.jpg" +"12208" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12208.jpg" +"12209" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12209.jpg" +"12210" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12210.jpg" +"12211" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12211.jpg" +"12212" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12212.jpg" +"12213" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12213.jpg" +"12214" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12214.jpg" +"12215" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12215.jpg" +"12216" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12216.jpg" +"12217" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12217.jpg" +"12218" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12218.jpg" +"12219" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12219.jpg" +"12220" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12220.jpg" +"12221" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12221.jpg" +"12222" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12222.jpg" +"12223" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12223.jpg" +"12224" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12224.jpg" +"12225" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12225.jpg" +"12226" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12226.jpg" +"12227" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12227.jpg" +"12228" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12228.jpg" +"12229" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12229.jpg" +"12230" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12230.jpg" +"12231" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12231.jpg" +"12232" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12232.jpg" +"12233" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12233.jpg" +"12234" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12234.jpg" +"12235" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12235.jpg" +"12236" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12236.jpg" +"12237" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12237.jpg" +"12238" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12238.jpg" +"12239" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12239.jpg" +"12240" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12240.jpg" +"12241" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12241.jpg" +"12242" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12242.jpg" +"12243" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12243.jpg" +"12244" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12244.jpg" +"12245" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12245.jpg" +"12246" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12246.jpg" +"12247" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12247.jpg" +"12248" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12248.jpg" +"12249" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12249.jpg" +"12250" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12250.jpg" +"12251" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12251.jpg" +"12252" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12252.jpg" +"12253" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12253.jpg" +"12254" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12254.jpg" +"12255" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12255.jpg" +"12256" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12256.jpg" +"12257" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12257.jpg" +"12258" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12258.jpg" +"12259" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12259.jpg" +"12260" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12260.jpg" +"12261" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12261.jpg" +"12262" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12262.jpg" +"12263" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12263.jpg" +"12264" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12264.jpg" +"12265" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12265.jpg" +"12266" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12266.jpg" +"12267" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12267.jpg" +"12268" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12268.jpg" +"12269" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12269.jpg" +"12270" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12270.jpg" +"12271" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12271.jpg" +"12272" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12272.jpg" +"12273" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12273.jpg" +"12274" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12274.jpg" +"12275" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12275.jpg" +"12276" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12276.jpg" +"12277" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12277.jpg" +"12278" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12278.jpg" +"12279" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12279.jpg" +"12280" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12280.jpg" +"12281" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12281.jpg" +"12282" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12282.jpg" +"12283" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12283.jpg" +"12284" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12284.jpg" +"12285" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12285.jpg" +"12286" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12286.jpg" +"12287" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12287.jpg" +"12288" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12288.jpg" +"12289" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12289.jpg" +"12290" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12290.jpg" +"12291" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12291.jpg" +"12292" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12292.jpg" +"12293" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12293.jpg" +"12294" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12294.jpg" +"12295" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12295.jpg" +"12296" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12296.jpg" +"12297" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12297.jpg" +"12298" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12298.jpg" +"12299" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12299.jpg" +"12300" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12300.jpg" +"12301" "Is there a coffee in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12301.jpg" +"12302" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12302.jpg" +"12303" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12303.jpg" +"12304" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12304.jpg" +"12305" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12305.jpg" +"12306" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12306.jpg" +"12307" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12307.jpg" +"12308" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12308.jpg" +"12309" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12309.jpg" +"12310" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12310.jpg" +"12311" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12311.jpg" +"12312" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12312.jpg" +"12313" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12313.jpg" +"12314" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12314.jpg" +"12315" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12315.jpg" +"12316" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12316.jpg" +"12317" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12317.jpg" +"12318" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12318.jpg" +"12319" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12319.jpg" +"12320" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12320.jpg" +"12321" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12321.jpg" +"12322" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12322.jpg" +"12323" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12323.jpg" +"12324" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12324.jpg" +"12325" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12325.jpg" +"12326" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12326.jpg" +"12327" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12327.jpg" +"12328" "Is there a signal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12328.jpg" +"12329" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12329.jpg" +"12330" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12330.jpg" +"12331" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12331.jpg" +"12332" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12332.jpg" +"12333" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12333.jpg" +"12334" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12334.jpg" +"12335" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12335.jpg" +"12336" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12336.jpg" +"12337" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12337.jpg" +"12338" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12338.jpg" +"12339" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12339.jpg" +"12340" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12340.jpg" +"12341" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12341.jpg" +"12342" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12342.jpg" +"12343" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12343.jpg" +"12344" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12344.jpg" +"12345" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12345.jpg" +"12346" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12346.jpg" +"12347" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12347.jpg" +"12348" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12348.jpg" +"12349" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12349.jpg" +"12350" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12350.jpg" +"12351" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12351.jpg" +"12352" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12352.jpg" +"12353" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12353.jpg" +"12354" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12354.jpg" +"12355" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12355.jpg" +"12356" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12356.jpg" +"12357" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12357.jpg" +"12358" "Is there a camera in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12358.jpg" +"12359" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12359.jpg" +"12360" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12360.jpg" +"12361" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12361.jpg" +"12362" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12362.jpg" +"12363" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12363.jpg" +"12364" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12364.jpg" +"12365" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12365.jpg" +"12366" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12366.jpg" +"12367" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12367.jpg" +"12368" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12368.jpg" +"12369" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12369.jpg" +"12370" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12370.jpg" +"12371" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12371.jpg" +"12372" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12372.jpg" +"12373" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12373.jpg" +"12374" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12374.jpg" +"12375" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12375.jpg" +"12376" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12376.jpg" +"12377" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12377.jpg" +"12378" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12378.jpg" +"12379" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12379.jpg" +"12380" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12380.jpg" +"12381" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12381.jpg" +"12382" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12382.jpg" +"12383" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12383.jpg" +"12384" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12384.jpg" +"12385" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12385.jpg" +"12386" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12386.jpg" +"12387" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12387.jpg" +"12388" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12388.jpg" +"12389" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12389.jpg" +"12390" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12390.jpg" +"12391" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12391.jpg" +"12392" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12392.jpg" +"12393" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12393.jpg" +"12394" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12394.jpg" +"12395" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12395.jpg" +"12396" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12396.jpg" +"12397" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12397.jpg" +"12398" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12398.jpg" +"12399" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12399.jpg" +"12400" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12400.jpg" +"12401" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12401.jpg" +"12402" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12402.jpg" +"12403" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12403.jpg" +"12404" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12404.jpg" +"12405" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12405.jpg" +"12406" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12406.jpg" +"12407" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12407.jpg" +"12408" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12408.jpg" +"12409" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12409.jpg" +"12410" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12410.jpg" +"12411" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12411.jpg" +"12412" "Is there a goose in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12412.jpg" +"12413" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12413.jpg" +"12414" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12414.jpg" +"12415" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12415.jpg" +"12416" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12416.jpg" +"12417" "Is there a signal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12417.jpg" +"12418" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12418.jpg" +"12419" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12419.jpg" +"12420" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12420.jpg" +"12421" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12421.jpg" +"12422" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12422.jpg" +"12423" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12423.jpg" +"12424" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12424.jpg" +"12425" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12425.jpg" +"12426" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12426.jpg" +"12427" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12427.jpg" +"12428" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12428.jpg" +"12429" "Is there a glass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12429.jpg" +"12430" "Is there a watch in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12430.jpg" +"12431" "Is there a hat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12431.jpg" +"12432" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12432.jpg" +"12433" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12433.jpg" +"12434" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12434.jpg" +"12435" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12435.jpg" +"12436" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12436.jpg" +"12437" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12437.jpg" +"12438" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12438.jpg" +"12439" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12439.jpg" +"12440" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12440.jpg" +"12441" "Is there a ball in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12441.jpg" +"12442" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12442.jpg" +"12443" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12443.jpg" +"12444" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12444.jpg" +"12445" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12445.jpg" +"12446" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12446.jpg" +"12447" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12447.jpg" +"12448" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12448.jpg" +"12449" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12449.jpg" +"12450" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12450.jpg" +"12451" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12451.jpg" +"12452" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12452.jpg" +"12453" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12453.jpg" +"12454" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12454.jpg" +"12455" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12455.jpg" +"12456" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12456.jpg" +"12457" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12457.jpg" +"12458" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12458.jpg" +"12459" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12459.jpg" +"12460" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12460.jpg" +"12461" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12461.jpg" +"12462" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12462.jpg" +"12463" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12463.jpg" +"12464" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12464.jpg" +"12465" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12465.jpg" +"12466" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12466.jpg" +"12467" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12467.jpg" +"12468" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12468.jpg" +"12469" "Is there a snow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12469.jpg" +"12470" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12470.jpg" +"12471" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12471.jpg" +"12472" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12472.jpg" +"12473" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12473.jpg" +"12474" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12474.jpg" +"12475" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12475.jpg" +"12476" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12476.jpg" +"12477" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12477.jpg" +"12478" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12478.jpg" +"12479" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12479.jpg" +"12480" "Is there a backpack in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12480.jpg" +"12481" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12481.jpg" +"12482" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12482.jpg" +"12483" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12483.jpg" +"12484" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12484.jpg" +"12485" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12485.jpg" +"12486" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12486.jpg" +"12487" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12487.jpg" +"12488" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12488.jpg" +"12489" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12489.jpg" +"12490" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12490.jpg" +"12491" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12491.jpg" +"12492" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12492.jpg" +"12493" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12493.jpg" +"12494" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12494.jpg" +"12495" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12495.jpg" +"12496" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12496.jpg" +"12497" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12497.jpg" +"12498" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12498.jpg" +"12499" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12499.jpg" +"12500" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12500.jpg" +"12501" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12501.jpg" +"12502" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12502.jpg" +"12503" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12503.jpg" +"12504" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12504.jpg" +"12505" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12505.jpg" +"12506" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12506.jpg" +"12507" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12507.jpg" +"12508" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12508.jpg" +"12509" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12509.jpg" +"12510" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12510.jpg" +"12511" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12511.jpg" +"12512" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12512.jpg" +"12513" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12513.jpg" +"12514" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12514.jpg" +"12515" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12515.jpg" +"12516" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12516.jpg" +"12517" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12517.jpg" +"12518" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12518.jpg" +"12519" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12519.jpg" +"12520" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12520.jpg" +"12521" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12521.jpg" +"12522" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12522.jpg" +"12523" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12523.jpg" +"12524" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12524.jpg" +"12525" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12525.jpg" +"12526" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12526.jpg" +"12527" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12527.jpg" +"12528" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12528.jpg" +"12529" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12529.jpg" +"12530" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12530.jpg" +"12531" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12531.jpg" +"12532" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12532.jpg" +"12533" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12533.jpg" +"12534" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12534.jpg" +"12535" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12535.jpg" +"12536" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12536.jpg" +"12537" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12537.jpg" +"12538" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12538.jpg" +"12539" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12539.jpg" +"12540" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12540.jpg" +"12541" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12541.jpg" +"12542" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12542.jpg" +"12543" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12543.jpg" +"12544" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12544.jpg" +"12545" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12545.jpg" +"12546" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12546.jpg" +"12547" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12547.jpg" +"12548" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12548.jpg" +"12549" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12549.jpg" +"12550" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12550.jpg" +"12551" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12551.jpg" +"12552" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12552.jpg" +"12553" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12553.jpg" +"12554" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12554.jpg" +"12555" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12555.jpg" +"12556" "Is there a controller in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12556.jpg" +"12557" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12557.jpg" +"12558" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12558.jpg" +"12559" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12559.jpg" +"12560" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12560.jpg" +"12561" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12561.jpg" +"12562" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12562.jpg" +"12563" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12563.jpg" +"12564" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12564.jpg" +"12565" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12565.jpg" +"12566" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12566.jpg" +"12567" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12567.jpg" +"12568" "Is there a man in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12568.jpg" +"12569" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12569.jpg" +"12570" "Is there a airport in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12570.jpg" +"12571" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12571.jpg" +"12572" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12572.jpg" +"12573" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12573.jpg" +"12574" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12574.jpg" +"12575" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12575.jpg" +"12576" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12576.jpg" +"12577" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12577.jpg" +"12578" "Is there a woman in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12578.jpg" +"12579" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12579.jpg" +"12580" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12580.jpg" +"12581" "Is there a controller in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12581.jpg" +"12582" "Is there a child in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12582.jpg" +"12583" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12583.jpg" +"12584" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12584.jpg" +"12585" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12585.jpg" +"12586" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12586.jpg" +"12587" "Is there a bath in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12587.jpg" +"12588" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12588.jpg" +"12589" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12589.jpg" +"12590" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12590.jpg" +"12591" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12591.jpg" +"12592" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12592.jpg" +"12593" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12593.jpg" +"12594" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12594.jpg" +"12595" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12595.jpg" +"12596" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12596.jpg" +"12597" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12597.jpg" +"12598" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12598.jpg" +"12599" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12599.jpg" +"12600" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12600.jpg" +"12601" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12601.jpg" +"12602" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12602.jpg" +"12603" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12603.jpg" +"12604" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12604.jpg" +"12605" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12605.jpg" +"12606" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12606.jpg" +"12607" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12607.jpg" +"12608" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12608.jpg" +"12609" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12609.jpg" +"12610" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12610.jpg" +"12611" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12611.jpg" +"12612" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12612.jpg" +"12613" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12613.jpg" +"12614" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12614.jpg" +"12615" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12615.jpg" +"12616" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12616.jpg" +"12617" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12617.jpg" +"12618" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12618.jpg" +"12619" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12619.jpg" +"12620" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12620.jpg" +"12621" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12621.jpg" +"12622" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12622.jpg" +"12623" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12623.jpg" +"12624" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12624.jpg" +"12625" "Is there a paddle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12625.jpg" +"12626" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12626.jpg" +"12627" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12627.jpg" +"12628" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12628.jpg" +"12629" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12629.jpg" +"12630" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12630.jpg" +"12631" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12631.jpg" +"12632" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12632.jpg" +"12633" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12633.jpg" +"12634" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12634.jpg" +"12635" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12635.jpg" +"12636" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12636.jpg" +"12637" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12637.jpg" +"12638" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12638.jpg" +"12639" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12639.jpg" +"12640" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12640.jpg" +"12641" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12641.jpg" +"12642" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12642.jpg" +"12643" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12643.jpg" +"12644" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12644.jpg" +"12645" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12645.jpg" +"12646" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12646.jpg" +"12647" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12647.jpg" +"12648" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12648.jpg" +"12649" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12649.jpg" +"12650" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12650.jpg" +"12651" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12651.jpg" +"12652" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12652.jpg" +"12653" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12653.jpg" +"12654" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12654.jpg" +"12655" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12655.jpg" +"12656" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12656.jpg" +"12657" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12657.jpg" +"12658" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12658.jpg" +"12659" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12659.jpg" +"12660" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12660.jpg" +"12661" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12661.jpg" +"12662" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12662.jpg" +"12663" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12663.jpg" +"12664" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12664.jpg" +"12665" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12665.jpg" +"12666" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12666.jpg" +"12667" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12667.jpg" +"12668" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12668.jpg" +"12669" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12669.jpg" +"12670" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12670.jpg" +"12671" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12671.jpg" +"12672" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12672.jpg" +"12673" "Is there a cathole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12673.jpg" +"12674" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12674.jpg" +"12675" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12675.jpg" +"12676" "Is there a controller in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12676.jpg" +"12677" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12677.jpg" +"12678" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12678.jpg" +"12679" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12679.jpg" +"12680" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12680.jpg" +"12681" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12681.jpg" +"12682" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12682.jpg" +"12683" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12683.jpg" +"12684" "Is there a controller in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12684.jpg" +"12685" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12685.jpg" +"12686" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12686.jpg" +"12687" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12687.jpg" +"12688" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12688.jpg" +"12689" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12689.jpg" +"12690" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12690.jpg" +"12691" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12691.jpg" +"12692" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12692.jpg" +"12693" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12693.jpg" +"12694" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12694.jpg" +"12695" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12695.jpg" +"12696" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12696.jpg" +"12697" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12697.jpg" +"12698" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12698.jpg" +"12699" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12699.jpg" +"12700" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12700.jpg" +"12701" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12701.jpg" +"12702" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12702.jpg" +"12703" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12703.jpg" +"12704" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12704.jpg" +"12705" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12705.jpg" +"12706" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12706.jpg" +"12707" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12707.jpg" +"12708" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12708.jpg" +"12709" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12709.jpg" +"12710" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12710.jpg" +"12711" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12711.jpg" +"12712" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12712.jpg" +"12713" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12713.jpg" +"12714" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12714.jpg" +"12715" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12715.jpg" +"12716" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12716.jpg" +"12717" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12717.jpg" +"12718" "Is there a horse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12718.jpg" +"12719" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12719.jpg" +"12720" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12720.jpg" +"12721" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12721.jpg" +"12722" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12722.jpg" +"12723" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12723.jpg" +"12724" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12724.jpg" +"12725" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12725.jpg" +"12726" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12726.jpg" +"12727" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12727.jpg" +"12728" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12728.jpg" +"12729" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12729.jpg" +"12730" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12730.jpg" +"12731" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12731.jpg" +"12732" "Is there a camel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12732.jpg" +"12733" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12733.jpg" +"12734" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12734.jpg" +"12735" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12735.jpg" +"12736" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12736.jpg" +"12737" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12737.jpg" +"12738" "Is there a pen in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12738.jpg" +"12739" "Is there a plane in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12739.jpg" +"12740" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12740.jpg" +"12741" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12741.jpg" +"12742" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12742.jpg" +"12743" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12743.jpg" +"12744" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12744.jpg" +"12745" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12745.jpg" +"12746" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12746.jpg" +"12747" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12747.jpg" +"12748" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12748.jpg" +"12749" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12749.jpg" +"12750" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12750.jpg" +"12751" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12751.jpg" +"12752" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12752.jpg" +"12753" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12753.jpg" +"12754" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12754.jpg" +"12755" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12755.jpg" +"12756" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12756.jpg" +"12757" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12757.jpg" +"12758" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12758.jpg" +"12759" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12759.jpg" +"12760" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12760.jpg" +"12761" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12761.jpg" +"12762" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12762.jpg" +"12763" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12763.jpg" +"12764" "Is there a camel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12764.jpg" +"12765" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12765.jpg" +"12766" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12766.jpg" +"12767" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12767.jpg" +"12768" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12768.jpg" +"12769" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12769.jpg" +"12770" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12770.jpg" +"12771" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12771.jpg" +"12772" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12772.jpg" +"12773" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12773.jpg" +"12774" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12774.jpg" +"12775" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12775.jpg" +"12776" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12776.jpg" +"12777" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12777.jpg" +"12778" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12778.jpg" +"12779" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12779.jpg" +"12780" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12780.jpg" +"12781" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12781.jpg" +"12782" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12782.jpg" +"12783" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12783.jpg" +"12784" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12784.jpg" +"12785" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12785.jpg" +"12786" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12786.jpg" +"12787" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12787.jpg" +"12788" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12788.jpg" +"12789" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12789.jpg" +"12790" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12790.jpg" +"12791" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12791.jpg" +"12792" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12792.jpg" +"12793" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12793.jpg" +"12794" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12794.jpg" +"12795" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12795.jpg" +"12796" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12796.jpg" +"12797" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12797.jpg" +"12798" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12798.jpg" +"12799" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12799.jpg" +"12800" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12800.jpg" +"12801" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12801.jpg" +"12802" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12802.jpg" +"12803" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12803.jpg" +"12804" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12804.jpg" +"12805" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12805.jpg" +"12806" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12806.jpg" +"12807" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12807.jpg" +"12808" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12808.jpg" +"12809" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12809.jpg" +"12810" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12810.jpg" +"12811" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12811.jpg" +"12812" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12812.jpg" +"12813" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12813.jpg" +"12814" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12814.jpg" +"12815" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12815.jpg" +"12816" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12816.jpg" +"12817" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12817.jpg" +"12818" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12818.jpg" +"12819" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12819.jpg" +"12820" "Is there a cake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12820.jpg" +"12821" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12821.jpg" +"12822" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12822.jpg" +"12823" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12823.jpg" +"12824" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12824.jpg" +"12825" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12825.jpg" +"12826" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12826.jpg" +"12827" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12827.jpg" +"12828" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12828.jpg" +"12829" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12829.jpg" +"12830" "Is there a window in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12830.jpg" +"12831" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12831.jpg" +"12832" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12832.jpg" +"12833" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12833.jpg" +"12834" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12834.jpg" +"12835" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12835.jpg" +"12836" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12836.jpg" +"12837" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12837.jpg" +"12838" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12838.jpg" +"12839" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12839.jpg" +"12840" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12840.jpg" +"12841" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12841.jpg" +"12842" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12842.jpg" +"12843" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12843.jpg" +"12844" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12844.jpg" +"12845" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12845.jpg" +"12846" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12846.jpg" +"12847" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12847.jpg" +"12848" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12848.jpg" +"12849" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12849.jpg" +"12850" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12850.jpg" +"12851" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12851.jpg" +"12852" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12852.jpg" +"12853" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12853.jpg" +"12854" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12854.jpg" +"12855" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12855.jpg" +"12856" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12856.jpg" +"12857" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12857.jpg" +"12858" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12858.jpg" +"12859" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12859.jpg" +"12860" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12860.jpg" +"12861" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12861.jpg" +"12862" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12862.jpg" +"12863" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12863.jpg" +"12864" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12864.jpg" +"12865" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12865.jpg" +"12866" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12866.jpg" +"12867" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12867.jpg" +"12868" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12868.jpg" +"12869" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12869.jpg" +"12870" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12870.jpg" +"12871" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12871.jpg" +"12872" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12872.jpg" +"12873" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12873.jpg" +"12874" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12874.jpg" +"12875" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12875.jpg" +"12876" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12876.jpg" +"12877" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12877.jpg" +"12878" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12878.jpg" +"12879" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12879.jpg" +"12880" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12880.jpg" +"12881" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12881.jpg" +"12882" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12882.jpg" +"12883" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12883.jpg" +"12884" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12884.jpg" +"12885" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12885.jpg" +"12886" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12886.jpg" +"12887" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12887.jpg" +"12888" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12888.jpg" +"12889" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12889.jpg" +"12890" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12890.jpg" +"12891" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12891.jpg" +"12892" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12892.jpg" +"12893" "Is there a kite in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12893.jpg" +"12894" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12894.jpg" +"12895" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12895.jpg" +"12896" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12896.jpg" +"12897" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12897.jpg" +"12898" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12898.jpg" +"12899" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12899.jpg" +"12900" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12900.jpg" +"12901" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12901.jpg" +"12902" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12902.jpg" +"12903" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12903.jpg" +"12904" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12904.jpg" +"12905" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12905.jpg" +"12906" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12906.jpg" +"12907" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12907.jpg" +"12908" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12908.jpg" +"12909" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12909.jpg" +"12910" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12910.jpg" +"12911" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12911.jpg" +"12912" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12912.jpg" +"12913" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12913.jpg" +"12914" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12914.jpg" +"12915" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12915.jpg" +"12916" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12916.jpg" +"12917" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12917.jpg" +"12918" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12918.jpg" +"12919" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12919.jpg" +"12920" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12920.jpg" +"12921" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12921.jpg" +"12922" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12922.jpg" +"12923" "Is there a apple in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12923.jpg" +"12924" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12924.jpg" +"12925" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12925.jpg" +"12926" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12926.jpg" +"12927" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12927.jpg" +"12928" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12928.jpg" +"12929" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12929.jpg" +"12930" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12930.jpg" +"12931" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12931.jpg" +"12932" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12932.jpg" +"12933" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12933.jpg" +"12934" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12934.jpg" +"12935" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12935.jpg" +"12936" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12936.jpg" +"12937" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12937.jpg" +"12938" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12938.jpg" +"12939" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12939.jpg" +"12940" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12940.jpg" +"12941" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12941.jpg" +"12942" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12942.jpg" +"12943" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12943.jpg" +"12944" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12944.jpg" +"12945" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12945.jpg" +"12946" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12946.jpg" +"12947" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12947.jpg" +"12948" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12948.jpg" +"12949" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12949.jpg" +"12950" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12950.jpg" +"12951" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12951.jpg" +"12952" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12952.jpg" +"12953" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12953.jpg" +"12954" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12954.jpg" +"12955" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12955.jpg" +"12956" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12956.jpg" +"12957" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12957.jpg" +"12958" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12958.jpg" +"12959" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12959.jpg" +"12960" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12960.jpg" +"12961" "Is there a zebra in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12961.jpg" +"12962" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12962.jpg" +"12963" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12963.jpg" +"12964" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12964.jpg" +"12965" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12965.jpg" +"12966" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12966.jpg" +"12967" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12967.jpg" +"12968" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12968.jpg" +"12969" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12969.jpg" +"12970" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12970.jpg" +"12971" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12971.jpg" +"12972" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12972.jpg" +"12973" "Is there a signal in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12973.jpg" +"12974" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12974.jpg" +"12975" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12975.jpg" +"12976" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12976.jpg" +"12977" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12977.jpg" +"12978" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12978.jpg" +"12979" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12979.jpg" +"12980" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12980.jpg" +"12981" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12981.jpg" +"12982" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12982.jpg" +"12983" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12983.jpg" +"12984" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12984.jpg" +"12985" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12985.jpg" +"12986" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12986.jpg" +"12987" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12987.jpg" +"12988" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12988.jpg" +"12989" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12989.jpg" +"12990" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12990.jpg" +"12991" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12991.jpg" +"12992" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12992.jpg" +"12993" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12993.jpg" +"12994" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12994.jpg" +"12995" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12995.jpg" +"12996" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12996.jpg" +"12997" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12997.jpg" +"12998" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12998.jpg" +"12999" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/12999.jpg" +"13000" "Is there a mouse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13000.jpg" +"13001" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13001.jpg" +"13002" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13002.jpg" +"13003" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13003.jpg" +"13004" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13004.jpg" +"13005" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13005.jpg" +"13006" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13006.jpg" +"13007" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13007.jpg" +"13008" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13008.jpg" +"13009" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13009.jpg" +"13010" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13010.jpg" +"13011" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13011.jpg" +"13012" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13012.jpg" +"13013" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13013.jpg" +"13014" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13014.jpg" +"13015" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13015.jpg" +"13016" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13016.jpg" +"13017" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13017.jpg" +"13018" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13018.jpg" +"13019" "Is there a camel in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13019.jpg" +"13020" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13020.jpg" +"13021" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13021.jpg" +"13022" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13022.jpg" +"13023" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13023.jpg" +"13024" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13024.jpg" +"13025" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13025.jpg" +"13026" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13026.jpg" +"13027" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13027.jpg" +"13028" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13028.jpg" +"13029" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13029.jpg" +"13030" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13030.jpg" +"13031" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13031.jpg" +"13032" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13032.jpg" +"13033" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13033.jpg" +"13034" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13034.jpg" +"13035" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13035.jpg" +"13036" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13036.jpg" +"13037" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13037.jpg" +"13038" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13038.jpg" +"13039" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13039.jpg" +"13040" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13040.jpg" +"13041" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13041.jpg" +"13042" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13042.jpg" +"13043" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13043.jpg" +"13044" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13044.jpg" +"13045" "Is there a book in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13045.jpg" +"13046" "Is there a pen in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13046.jpg" +"13047" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13047.jpg" +"13048" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13048.jpg" +"13049" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13049.jpg" +"13050" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13050.jpg" +"13051" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13051.jpg" +"13052" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13052.jpg" +"13053" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13053.jpg" +"13054" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13054.jpg" +"13055" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13055.jpg" +"13056" "Is there a bridge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13056.jpg" +"13057" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13057.jpg" +"13058" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13058.jpg" +"13059" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13059.jpg" +"13060" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13060.jpg" +"13061" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13061.jpg" +"13062" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13062.jpg" +"13063" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13063.jpg" +"13064" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13064.jpg" +"13065" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13065.jpg" +"13066" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13066.jpg" +"13067" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13067.jpg" +"13068" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13068.jpg" +"13069" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13069.jpg" +"13070" "Is there a kite in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13070.jpg" +"13071" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13071.jpg" +"13072" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13072.jpg" +"13073" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13073.jpg" +"13074" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13074.jpg" +"13075" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13075.jpg" +"13076" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13076.jpg" +"13077" "Is there a laptop in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13077.jpg" +"13078" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13078.jpg" +"13079" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13079.jpg" +"13080" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13080.jpg" +"13081" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13081.jpg" +"13082" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13082.jpg" +"13083" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13083.jpg" +"13084" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13084.jpg" +"13085" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13085.jpg" +"13086" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13086.jpg" +"13087" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13087.jpg" +"13088" "Is there a sheep in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13088.jpg" +"13089" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13089.jpg" +"13090" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13090.jpg" +"13091" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13091.jpg" +"13092" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13092.jpg" +"13093" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13093.jpg" +"13094" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13094.jpg" +"13095" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13095.jpg" +"13096" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13096.jpg" +"13097" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13097.jpg" +"13098" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13098.jpg" +"13099" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13099.jpg" +"13100" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13100.jpg" +"13101" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13101.jpg" +"13102" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13102.jpg" +"13103" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13103.jpg" +"13104" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13104.jpg" +"13105" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13105.jpg" +"13106" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13106.jpg" +"13107" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13107.jpg" +"13108" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13108.jpg" +"13109" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13109.jpg" +"13110" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13110.jpg" +"13111" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13111.jpg" +"13112" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13112.jpg" +"13113" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13113.jpg" +"13114" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13114.jpg" +"13115" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13115.jpg" +"13116" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13116.jpg" +"13117" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13117.jpg" +"13118" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13118.jpg" +"13119" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13119.jpg" +"13120" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13120.jpg" +"13121" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13121.jpg" +"13122" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13122.jpg" +"13123" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13123.jpg" +"13124" "Is there a island in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13124.jpg" +"13125" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13125.jpg" +"13126" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13126.jpg" +"13127" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13127.jpg" +"13128" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13128.jpg" +"13129" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13129.jpg" +"13130" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13130.jpg" +"13131" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13131.jpg" +"13132" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13132.jpg" +"13133" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13133.jpg" +"13134" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13134.jpg" +"13135" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13135.jpg" +"13136" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13136.jpg" +"13137" "Is there a computer in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13137.jpg" +"13138" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13138.jpg" +"13139" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13139.jpg" +"13140" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13140.jpg" +"13141" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13141.jpg" +"13142" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13142.jpg" +"13143" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13143.jpg" +"13144" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13144.jpg" +"13145" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13145.jpg" +"13146" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13146.jpg" +"13147" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13147.jpg" +"13148" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13148.jpg" +"13149" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13149.jpg" +"13150" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13150.jpg" +"13151" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13151.jpg" +"13152" "Is there a scoon in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13152.jpg" +"13153" "Is there a cake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13153.jpg" +"13154" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13154.jpg" +"13155" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13155.jpg" +"13156" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13156.jpg" +"13157" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13157.jpg" +"13158" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13158.jpg" +"13159" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13159.jpg" +"13160" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13160.jpg" +"13161" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13161.jpg" +"13162" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13162.jpg" +"13163" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13163.jpg" +"13164" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13164.jpg" +"13165" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13165.jpg" +"13166" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13166.jpg" +"13167" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13167.jpg" +"13168" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13168.jpg" +"13169" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13169.jpg" +"13170" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13170.jpg" +"13171" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13171.jpg" +"13172" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13172.jpg" +"13173" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13173.jpg" +"13174" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13174.jpg" +"13175" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13175.jpg" +"13176" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13176.jpg" +"13177" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13177.jpg" +"13178" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13178.jpg" +"13179" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13179.jpg" +"13180" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13180.jpg" +"13181" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13181.jpg" +"13182" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13182.jpg" +"13183" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13183.jpg" +"13184" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13184.jpg" +"13185" "Is there a road in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13185.jpg" +"13186" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13186.jpg" +"13187" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13187.jpg" +"13188" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13188.jpg" +"13189" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13189.jpg" +"13190" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13190.jpg" +"13191" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13191.jpg" +"13192" "Is there a doghole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13192.jpg" +"13193" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13193.jpg" +"13194" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13194.jpg" +"13195" "Is there a pillow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13195.jpg" +"13196" "Is there a bed in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13196.jpg" +"13197" "Is there a cabinet in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13197.jpg" +"13198" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13198.jpg" +"13199" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13199.jpg" +"13200" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13200.jpg" +"13201" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13201.jpg" +"13202" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13202.jpg" +"13203" "Is there a flower in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13203.jpg" +"13204" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13204.jpg" +"13205" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13205.jpg" +"13206" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13206.jpg" +"13207" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13207.jpg" +"13208" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13208.jpg" +"13209" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13209.jpg" +"13210" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13210.jpg" +"13211" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13211.jpg" +"13212" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13212.jpg" +"13213" "Is there a bin in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13213.jpg" +"13214" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13214.jpg" +"13215" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13215.jpg" +"13216" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13216.jpg" +"13217" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13217.jpg" +"13218" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13218.jpg" +"13219" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13219.jpg" +"13220" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13220.jpg" +"13221" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13221.jpg" +"13222" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13222.jpg" +"13223" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13223.jpg" +"13224" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13224.jpg" +"13225" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13225.jpg" +"13226" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13226.jpg" +"13227" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13227.jpg" +"13228" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13228.jpg" +"13229" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13229.jpg" +"13230" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13230.jpg" +"13231" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13231.jpg" +"13232" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13232.jpg" +"13233" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13233.jpg" +"13234" "Is there a lake in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13234.jpg" +"13235" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13235.jpg" +"13236" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13236.jpg" +"13237" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13237.jpg" +"13238" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13238.jpg" +"13239" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13239.jpg" +"13240" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13240.jpg" +"13241" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13241.jpg" +"13242" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13242.jpg" +"13243" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13243.jpg" +"13244" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13244.jpg" +"13245" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13245.jpg" +"13246" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13246.jpg" +"13247" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13247.jpg" +"13248" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13248.jpg" +"13249" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13249.jpg" +"13250" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13250.jpg" +"13251" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13251.jpg" +"13252" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13252.jpg" +"13253" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13253.jpg" +"13254" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13254.jpg" +"13255" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13255.jpg" +"13256" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13256.jpg" +"13257" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13257.jpg" +"13258" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13258.jpg" +"13259" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13259.jpg" +"13260" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13260.jpg" +"13261" "Is there a cow in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13261.jpg" +"13262" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13262.jpg" +"13263" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13263.jpg" +"13264" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13264.jpg" +"13265" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13265.jpg" +"13266" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13266.jpg" +"13267" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13267.jpg" +"13268" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13268.jpg" +"13269" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13269.jpg" +"13270" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13270.jpg" +"13271" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13271.jpg" +"13272" "Is there a umbrella in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13272.jpg" +"13273" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13273.jpg" +"13274" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13274.jpg" +"13275" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13275.jpg" +"13276" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13276.jpg" +"13277" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13277.jpg" +"13278" "Is there a seegull in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13278.jpg" +"13279" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13279.jpg" +"13280" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13280.jpg" +"13281" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13281.jpg" +"13282" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13282.jpg" +"13283" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13283.jpg" +"13284" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13284.jpg" +"13285" "Is there a doghole in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13285.jpg" +"13286" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13286.jpg" +"13287" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13287.jpg" +"13288" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13288.jpg" +"13289" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13289.jpg" +"13290" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13290.jpg" +"13291" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13291.jpg" +"13292" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13292.jpg" +"13293" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13293.jpg" +"13294" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13294.jpg" +"13295" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13295.jpg" +"13296" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13296.jpg" +"13297" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13297.jpg" +"13298" "Is there a toy in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13298.jpg" +"13299" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13299.jpg" +"13300" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13300.jpg" +"13301" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13301.jpg" +"13302" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13302.jpg" +"13303" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13303.jpg" +"13304" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13304.jpg" +"13305" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13305.jpg" +"13306" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13306.jpg" +"13307" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13307.jpg" +"13308" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13308.jpg" +"13309" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13309.jpg" +"13310" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13310.jpg" +"13311" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13311.jpg" +"13312" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13312.jpg" +"13313" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13313.jpg" +"13314" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13314.jpg" +"13315" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13315.jpg" +"13316" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13316.jpg" +"13317" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13317.jpg" +"13318" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13318.jpg" +"13319" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13319.jpg" +"13320" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13320.jpg" +"13321" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13321.jpg" +"13322" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13322.jpg" +"13323" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13323.jpg" +"13324" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13324.jpg" +"13325" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13325.jpg" +"13326" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13326.jpg" +"13327" "Is there a ship in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13327.jpg" +"13328" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13328.jpg" +"13329" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13329.jpg" +"13330" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13330.jpg" +"13331" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13331.jpg" +"13332" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13332.jpg" +"13333" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13333.jpg" +"13334" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13334.jpg" +"13335" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13335.jpg" +"13336" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13336.jpg" +"13337" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13337.jpg" +"13338" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13338.jpg" +"13339" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13339.jpg" +"13340" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13340.jpg" +"13341" "Is there a apple in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13341.jpg" +"13342" "Is there a banana in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13342.jpg" +"13343" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13343.jpg" +"13344" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13344.jpg" +"13345" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13345.jpg" +"13346" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13346.jpg" +"13347" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13347.jpg" +"13348" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13348.jpg" +"13349" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13349.jpg" +"13350" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13350.jpg" +"13351" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13351.jpg" +"13352" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13352.jpg" +"13353" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13353.jpg" +"13354" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13354.jpg" +"13355" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13355.jpg" +"13356" "Is there a fork in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13356.jpg" +"13357" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13357.jpg" +"13358" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13358.jpg" +"13359" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13359.jpg" +"13360" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13360.jpg" +"13361" "Is there a phone in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13361.jpg" +"13362" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13362.jpg" +"13363" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13363.jpg" +"13364" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13364.jpg" +"13365" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13365.jpg" +"13366" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13366.jpg" +"13367" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13367.jpg" +"13368" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13368.jpg" +"13369" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13369.jpg" +"13370" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13370.jpg" +"13371" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13371.jpg" +"13372" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13372.jpg" +"13373" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13373.jpg" +"13374" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13374.jpg" +"13375" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13375.jpg" +"13376" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13376.jpg" +"13377" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13377.jpg" +"13378" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13378.jpg" +"13379" "Is there a horse in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13379.jpg" +"13380" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13380.jpg" +"13381" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13381.jpg" +"13382" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13382.jpg" +"13383" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13383.jpg" +"13384" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13384.jpg" +"13385" "Is there a plate in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13385.jpg" +"13386" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13386.jpg" +"13387" "Is there a apple in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13387.jpg" +"13388" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13388.jpg" +"13389" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13389.jpg" +"13390" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13390.jpg" +"13391" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13391.jpg" +"13392" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13392.jpg" +"13393" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13393.jpg" +"13394" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13394.jpg" +"13395" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13395.jpg" +"13396" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13396.jpg" +"13397" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13397.jpg" +"13398" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13398.jpg" +"13399" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13399.jpg" +"13400" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13400.jpg" +"13401" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13401.jpg" +"13402" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13402.jpg" +"13403" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13403.jpg" +"13404" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13404.jpg" +"13405" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13405.jpg" +"13406" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13406.jpg" +"13407" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13407.jpg" +"13408" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13408.jpg" +"13409" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13409.jpg" +"13410" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13410.jpg" +"13411" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13411.jpg" +"13412" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13412.jpg" +"13413" "Is there a apple in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13413.jpg" +"13414" "Is there a banana in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13414.jpg" +"13415" "Is there a knife in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13415.jpg" +"13416" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13416.jpg" +"13417" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13417.jpg" +"13418" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13418.jpg" +"13419" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13419.jpg" +"13420" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13420.jpg" +"13421" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13421.jpg" +"13422" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13422.jpg" +"13423" "Is there a sun in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13423.jpg" +"13424" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13424.jpg" +"13425" "Is there a cat in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13425.jpg" +"13426" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13426.jpg" +"13427" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13427.jpg" +"13428" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13428.jpg" +"13429" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13429.jpg" +"13430" "Is there a wall in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13430.jpg" +"13431" "Is there a table in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13431.jpg" +"13432" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13432.jpg" +"13433" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13433.jpg" +"13434" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13434.jpg" +"13435" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13435.jpg" +"13436" "Is there a duck in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13436.jpg" +"13437" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13437.jpg" +"13438" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13438.jpg" +"13439" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13439.jpg" +"13440" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13440.jpg" +"13441" "Is there a fish in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13441.jpg" +"13442" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13442.jpg" +"13443" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13443.jpg" +"13444" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13444.jpg" +"13445" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13445.jpg" +"13446" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13446.jpg" +"13447" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13447.jpg" +"13448" "Is there a bicycle in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13448.jpg" +"13449" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13449.jpg" +"13450" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13450.jpg" +"13451" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13451.jpg" +"13452" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13452.jpg" +"13453" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13453.jpg" +"13454" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13454.jpg" +"13455" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13455.jpg" +"13456" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13456.jpg" +"13457" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13457.jpg" +"13458" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13458.jpg" +"13459" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13459.jpg" +"13460" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13460.jpg" +"13461" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13461.jpg" +"13462" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13462.jpg" +"13463" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13463.jpg" +"13464" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13464.jpg" +"13465" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13465.jpg" +"13466" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13466.jpg" +"13467" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13467.jpg" +"13468" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13468.jpg" +"13469" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13469.jpg" +"13470" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13470.jpg" +"13471" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13471.jpg" +"13472" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13472.jpg" +"13473" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13473.jpg" +"13474" "Is there a scoon in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13474.jpg" +"13475" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13475.jpg" +"13476" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13476.jpg" +"13477" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13477.jpg" +"13478" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13478.jpg" +"13479" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13479.jpg" +"13480" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13480.jpg" +"13481" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13481.jpg" +"13482" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13482.jpg" +"13483" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13483.jpg" +"13484" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13484.jpg" +"13485" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13485.jpg" +"13486" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13486.jpg" +"13487" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13487.jpg" +"13488" "Is there a motorbike in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13488.jpg" +"13489" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13489.jpg" +"13490" "Is there a streetlamp in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13490.jpg" +"13491" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13491.jpg" +"13492" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13492.jpg" +"13493" "Is there a sofa in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13493.jpg" +"13494" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13494.jpg" +"13495" "Is there a television in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13495.jpg" +"13496" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13496.jpg" +"13497" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13497.jpg" +"13498" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13498.jpg" +"13499" "Is there a forest in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13499.jpg" +"13500" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13500.jpg" +"13501" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13501.jpg" +"13502" "Is there a fence in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13502.jpg" +"13503" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13503.jpg" +"13504" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13504.jpg" +"13505" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13505.jpg" +"13506" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13506.jpg" +"13507" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13507.jpg" +"13508" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13508.jpg" +"13509" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13509.jpg" +"13510" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13510.jpg" +"13511" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13511.jpg" +"13512" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13512.jpg" +"13513" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13513.jpg" +"13514" "Is there a mountain in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13514.jpg" +"13515" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13515.jpg" +"13516" "Is there a ground in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13516.jpg" +"13517" "Is there a sky in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13517.jpg" +"13518" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13518.jpg" +"13519" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13519.jpg" +"13520" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13520.jpg" +"13521" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13521.jpg" +"13522" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13522.jpg" +"13523" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13523.jpg" +"13524" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13524.jpg" +"13525" "Is there a house in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13525.jpg" +"13526" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13526.jpg" +"13527" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13527.jpg" +"13528" "Is there a bird in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13528.jpg" +"13529" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13529.jpg" +"13530" "Is there a tent in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13530.jpg" +"13531" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13531.jpg" +"13532" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13532.jpg" +"13533" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13533.jpg" +"13534" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13534.jpg" +"13535" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13535.jpg" +"13536" "Is there a dog in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13536.jpg" +"13537" "Is there a beach in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13537.jpg" +"13538" "Is there a lounge in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13538.jpg" +"13539" "Is there a cloud in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13539.jpg" +"13540" "Is there a sea in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13540.jpg" +"13541" "Is there a surfboard in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13541.jpg" +"13542" "Is there a cup in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13542.jpg" +"13543" "Is there a chair in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13543.jpg" +"13544" "Is there a tissue in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13544.jpg" +"13545" "Is there a person in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13545.jpg" +"13546" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13546.jpg" +"13547" "Is there a grass in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13547.jpg" +"13548" "Is there a tree in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13548.jpg" +"13549" "Is there a sign in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13549.jpg" +"13550" "Is there a car in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13550.jpg" +"13551" "Is there a bench in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13551.jpg" +"13552" "Is there a floor in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13552.jpg" +"13553" "Is there a door in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13553.jpg" +"13554" "Is there a light in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13554.jpg" +"13555" "Is there a sink in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13555.jpg" +"13556" "Is there a tap in this image?" "no" "discriminative-hallucination" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13556.jpg" +"13557" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13557.jpg" +"13558" "Is there direct contact between the person and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13558.jpg" +"13559" "Is there direct contact between the man and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13559.jpg" +"13560" "Is there direct contact between the man and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13560.jpg" +"13561" "Is there direct contact between the child and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13561.jpg" +"13562" "Is there direct contact between the woman and paddle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13562.jpg" +"13563" "Is there direct contact between the woman and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13563.jpg" +"13564" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13564.jpg" +"13565" "Is there direct contact between the person and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13565.jpg" +"13566" "Is there direct contact between the person and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13566.jpg" +"13567" "Is there direct contact between the child and bucket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13567.jpg" +"13568" "Is there direct contact between the child and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13568.jpg" +"13569" "Is there direct contact between the child and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13569.jpg" +"13570" "Is there direct contact between the child and goose?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13570.jpg" +"13571" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13571.jpg" +"13572" "Is there direct contact between the man and football?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13572.jpg" +"13573" "Is there direct contact between the man and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13573.jpg" +"13574" "Is there direct contact between the hat and ball?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13574.jpg" +"13575" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13575.jpg" +"13576" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13576.jpg" +"13577" "Is there direct contact between the woman and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13577.jpg" +"13578" "Is there direct contact between the woman and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13578.jpg" +"13579" "Is there direct contact between the man and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13579.jpg" +"13580" "Is there direct contact between the woman and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13580.jpg" +"13581" "Is there direct contact between the man and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13581.jpg" +"13582" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13582.jpg" +"13583" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13583.jpg" +"13584" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13584.jpg" +"13585" "Is there direct contact between the man and mountain?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13585.jpg" +"13586" "Is there direct contact between the man and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13586.jpg" +"13587" "Is there direct contact between the person and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13587.jpg" +"13588" "Is there direct contact between the person and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13588.jpg" +"13589" "Is there direct contact between the woman and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13589.jpg" +"13590" "Is there direct contact between the woman and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13590.jpg" +"13591" "Is there direct contact between the ground and dog?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13591.jpg" +"13592" "Is there direct contact between the mountain and woman?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13592.jpg" +"13593" "Is there direct contact between the woman and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13593.jpg" +"13594" "Is there direct contact between the person and desert?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13594.jpg" +"13595" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13595.jpg" +"13596" "Is there direct contact between the man and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13596.jpg" +"13597" "Is there direct contact between the man and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13597.jpg" +"13598" "Is there direct contact between the lake and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13598.jpg" +"13599" "Is there direct contact between the car and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13599.jpg" +"13600" "Is there direct contact between the deer and child?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13600.jpg" +"13601" "Is there direct contact between the child and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13601.jpg" +"13602" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13602.jpg" +"13603" "Is there direct contact between the motorbike and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13603.jpg" +"13604" "Is there direct contact between the ground and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13604.jpg" +"13605" "Is there direct contact between the forest and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13605.jpg" +"13606" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13606.jpg" +"13607" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13607.jpg" +"13608" "Is there direct contact between the child and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13608.jpg" +"13609" "Is there direct contact between the child and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13609.jpg" +"13610" "Is there direct contact between the child and bird?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13610.jpg" +"13611" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13611.jpg" +"13612" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13612.jpg" +"13613" "Is there direct contact between the person and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13613.jpg" +"13614" "Is there direct contact between the bicycle and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13614.jpg" +"13615" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13615.jpg" +"13616" "Is there direct contact between the glass and football?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13616.jpg" +"13617" "Is there direct contact between the person and guardrail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13617.jpg" +"13618" "Is there direct contact between the sea and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13618.jpg" +"13619" "Is there direct contact between the person and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13619.jpg" +"13620" "Is there direct contact between the person and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13620.jpg" +"13621" "Is there direct contact between the person and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13621.jpg" +"13622" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13622.jpg" +"13623" "Is there direct contact between the football and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13623.jpg" +"13624" "Is there direct contact between the person and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13624.jpg" +"13625" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13625.jpg" +"13626" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13626.jpg" +"13627" "Is there direct contact between the dog and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13627.jpg" +"13628" "Is there direct contact between the person and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13628.jpg" +"13629" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13629.jpg" +"13630" "Is there direct contact between the dog and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13630.jpg" +"13631" "Is there direct contact between the woman and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13631.jpg" +"13632" "Is there direct contact between the woman and sheep?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13632.jpg" +"13633" "Is there direct contact between the man and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13633.jpg" +"13634" "Is there direct contact between the man and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13634.jpg" +"13635" "Is there direct contact between the dog and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13635.jpg" +"13636" "Is there direct contact between the person and frisbee?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13636.jpg" +"13637" "Is there direct contact between the person and watermelon?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13637.jpg" +"13638" "Is there direct contact between the person and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13638.jpg" +"13639" "Is there direct contact between the person and umbrella?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13639.jpg" +"13640" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13640.jpg" +"13641" "Is there direct contact between the woman and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13641.jpg" +"13642" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13642.jpg" +"13643" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13643.jpg" +"13644" "Is there direct contact between the man and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13644.jpg" +"13645" "Is there direct contact between the man and car?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13645.jpg" +"13646" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13646.jpg" +"13647" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13647.jpg" +"13648" "Is there direct contact between the child and ball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13648.jpg" +"13649" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13649.jpg" +"13650" "Is there direct contact between the dog and flower?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13650.jpg" +"13651" "Is there direct contact between the man and guitar?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13651.jpg" +"13652" "Is there direct contact between the grass and guitar?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13652.jpg" +"13653" "Is there direct contact between the dog and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13653.jpg" +"13654" "Is there direct contact between the child and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13654.jpg" +"13655" "Is there direct contact between the bicycle and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13655.jpg" +"13656" "Is there direct contact between the person and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13656.jpg" +"13657" "Is there direct contact between the person and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13657.jpg" +"13658" "Is there direct contact between the cow and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13658.jpg" +"13659" "Is there direct contact between the cow and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13659.jpg" +"13660" "Is there direct contact between the woman and flower?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13660.jpg" +"13661" "Is there direct contact between the person and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13661.jpg" +"13662" "Is there direct contact between the dog and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13662.jpg" +"13663" "Is there direct contact between the dog and ball?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13663.jpg" +"13664" "Is there direct contact between the person and pen?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13664.jpg" +"13665" "Is there direct contact between the book and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13665.jpg" +"13666" "Is there direct contact between the dog and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13666.jpg" +"13667" "Is there direct contact between the man and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13667.jpg" +"13668" "Is there direct contact between the man and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13668.jpg" +"13669" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13669.jpg" +"13670" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13670.jpg" +"13671" "Is there direct contact between the person and camera?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13671.jpg" +"13672" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13672.jpg" +"13673" "Is there direct contact between the dog and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13673.jpg" +"13674" "Is there direct contact between the man and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13674.jpg" +"13675" "Is there direct contact between the man and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13675.jpg" +"13676" "Is there direct contact between the horse and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13676.jpg" +"13677" "Is there direct contact between the person and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13677.jpg" +"13678" "Is there direct contact between the person and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13678.jpg" +"13679" "Is there direct contact between the car and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13679.jpg" +"13680" "Is there direct contact between the bicycle and woman?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13680.jpg" +"13681" "Is there direct contact between the woman and fence?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13681.jpg" +"13682" "Is there direct contact between the child and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13682.jpg" +"13683" "Is there direct contact between the child and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13683.jpg" +"13684" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13684.jpg" +"13685" "Is there direct contact between the dog and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13685.jpg" +"13686" "Is there direct contact between the man and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13686.jpg" +"13687" "Is there direct contact between the man and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13687.jpg" +"13688" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13688.jpg" +"13689" "Is there direct contact between the person and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13689.jpg" +"13690" "Is there direct contact between the dog and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13690.jpg" +"13691" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13691.jpg" +"13692" "Is there direct contact between the person and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13692.jpg" +"13693" "Is there direct contact between the child and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13693.jpg" +"13694" "Is there direct contact between the plane and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13694.jpg" +"13695" "Is there direct contact between the plane and car?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13695.jpg" +"13696" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13696.jpg" +"13697" "Is there direct contact between the child and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13697.jpg" +"13698" "Is there direct contact between the child and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13698.jpg" +"13699" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13699.jpg" +"13700" "Is there direct contact between the grass and ball?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13700.jpg" +"13701" "Is there direct contact between the man and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13701.jpg" +"13702" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13702.jpg" +"13703" "Is there direct contact between the child and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13703.jpg" +"13704" "Is there direct contact between the child and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13704.jpg" +"13705" "Is there direct contact between the man and bath?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13705.jpg" +"13706" "Is there direct contact between the man and tap?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13706.jpg" +"13707" "Is there direct contact between the ball and dog?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13707.jpg" +"13708" "Is there direct contact between the ball and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13708.jpg" +"13709" "Is there direct contact between the person and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13709.jpg" +"13710" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13710.jpg" +"13711" "Is there direct contact between the sea and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13711.jpg" +"13712" "Is there direct contact between the person and bicycle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13712.jpg" +"13713" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13713.jpg" +"13714" "Is there direct contact between the man and ship?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13714.jpg" +"13715" "Is there direct contact between the dog and bottle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13715.jpg" +"13716" "Is there direct contact between the bottle and snow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13716.jpg" +"13717" "Is there direct contact between the person and camera?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13717.jpg" +"13718" "Is there direct contact between the camera and backpack?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13718.jpg" +"13719" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13719.jpg" +"13720" "Is there direct contact between the person and stair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13720.jpg" +"13721" "Is there direct contact between the dog and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13721.jpg" +"13722" "Is there direct contact between the toy and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13722.jpg" +"13723" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13723.jpg" +"13724" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13724.jpg" +"13725" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13725.jpg" +"13726" "Is there direct contact between the bus and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13726.jpg" +"13727" "Is there direct contact between the person and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13727.jpg" +"13728" "Is there direct contact between the bicycle and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13728.jpg" +"13729" "Is there direct contact between the man and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13729.jpg" +"13730" "Is there direct contact between the man and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13730.jpg" +"13731" "Is there direct contact between the man and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13731.jpg" +"13732" "Is there direct contact between the woman and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13732.jpg" +"13733" "Is there direct contact between the woman and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13733.jpg" +"13734" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13734.jpg" +"13735" "Is there direct contact between the woman and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13735.jpg" +"13736" "Is there direct contact between the woman and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13736.jpg" +"13737" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13737.jpg" +"13738" "Is there direct contact between the sea and flag?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13738.jpg" +"13739" "Is there direct contact between the person and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13739.jpg" +"13740" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13740.jpg" +"13741" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13741.jpg" +"13742" "Is there direct contact between the man and football?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13742.jpg" +"13743" "Is there direct contact between the man and guitar?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13743.jpg" +"13744" "Is there direct contact between the guitar and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13744.jpg" +"13745" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13745.jpg" +"13746" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13746.jpg" +"13747" "Is there direct contact between the man and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13747.jpg" +"13748" "Is there direct contact between the man and bird?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13748.jpg" +"13749" "Is there direct contact between the woman and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13749.jpg" +"13750" "Is there direct contact between the woman and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13750.jpg" +"13751" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13751.jpg" +"13752" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13752.jpg" +"13753" "Is there direct contact between the man and stair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13753.jpg" +"13754" "Is there direct contact between the woman and stair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13754.jpg" +"13755" "Is there direct contact between the woman and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13755.jpg" +"13756" "Is there direct contact between the woman and camera?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13756.jpg" +"13757" "Is there direct contact between the camera and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13757.jpg" +"13758" "Is there direct contact between the woman and beer?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13758.jpg" +"13759" "Is there direct contact between the woman and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13759.jpg" +"13760" "Is there direct contact between the woman and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13760.jpg" +"13761" "Is there direct contact between the child and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13761.jpg" +"13762" "Is there direct contact between the child and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13762.jpg" +"13763" "Is there direct contact between the child and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13763.jpg" +"13764" "Is there direct contact between the woman and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13764.jpg" +"13765" "Is there direct contact between the woman and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13765.jpg" +"13766" "Is there direct contact between the man and camera?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13766.jpg" +"13767" "Is there direct contact between the camera and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13767.jpg" +"13768" "Is there direct contact between the support and microphone?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13768.jpg" +"13769" "Is there direct contact between the person and flag?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13769.jpg" +"13770" "Is there direct contact between the flag and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13770.jpg" +"13771" "Is there direct contact between the person and pen?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13771.jpg" +"13772" "Is there direct contact between the pen and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13772.jpg" +"13773" "Is there direct contact between the ship and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13773.jpg" +"13774" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13774.jpg" +"13775" "Is there direct contact between the woman and glass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13775.jpg" +"13776" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13776.jpg" +"13777" "Is there direct contact between the man and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13777.jpg" +"13778" "Is there direct contact between the grass and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13778.jpg" +"13779" "Is there direct contact between the person and tent?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13779.jpg" +"13780" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13780.jpg" +"13781" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13781.jpg" +"13782" "Is there direct contact between the person and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13782.jpg" +"13783" "Is there direct contact between the man and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13783.jpg" +"13784" "Is there direct contact between the woman and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13784.jpg" +"13785" "Is there direct contact between the man and coconut?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13785.jpg" +"13786" "Is there direct contact between the knife and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13786.jpg" +"13787" "Is there direct contact between the man and football?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13787.jpg" +"13788" "Is there direct contact between the car and cow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13788.jpg" +"13789" "Is there direct contact between the car and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13789.jpg" +"13790" "Is there direct contact between the child and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13790.jpg" +"13791" "Is there direct contact between the child and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13791.jpg" +"13792" "Is there direct contact between the frisbee and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13792.jpg" +"13793" "Is there direct contact between the person and desert?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13793.jpg" +"13794" "Is there direct contact between the child and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13794.jpg" +"13795" "Is there direct contact between the child and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13795.jpg" +"13796" "Is there direct contact between the child and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13796.jpg" +"13797" "Is there direct contact between the grass and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13797.jpg" +"13798" "Is there direct contact between the woman and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13798.jpg" +"13799" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13799.jpg" +"13800" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13800.jpg" +"13801" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13801.jpg" +"13802" "Is there direct contact between the woman and glass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13802.jpg" +"13803" "Is there direct contact between the glass and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13803.jpg" +"13804" "Is there direct contact between the camel and desert?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13804.jpg" +"13805" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13805.jpg" +"13806" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13806.jpg" +"13807" "Is there direct contact between the dog and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13807.jpg" +"13808" "Is there direct contact between the dog and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13808.jpg" +"13809" "Is there direct contact between the person and desert?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13809.jpg" +"13810" "Is there direct contact between the ground and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13810.jpg" +"13811" "Is there direct contact between the grass and apple?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13811.jpg" +"13812" "Is there direct contact between the candle and blanket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13812.jpg" +"13813" "Is there direct contact between the candle and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13813.jpg" +"13814" "Is there direct contact between the balloon and balloon?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13814.jpg" +"13815" "Is there direct contact between the volleyball and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13815.jpg" +"13816" "Is there direct contact between the football and net?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13816.jpg" +"13817" "Is there direct contact between the grass and football?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13817.jpg" +"13818" "Is there direct contact between the skate and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13818.jpg" +"13819" "Is there direct contact between the skate and basketball?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13819.jpg" +"13820" "Is there direct contact between the basketball and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13820.jpg" +"13821" "Is there direct contact between the child and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13821.jpg" +"13822" "Is there direct contact between the hat and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13822.jpg" +"13823" "Is there direct contact between the person and basketball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13823.jpg" +"13824" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13824.jpg" +"13825" "Is there direct contact between the bed and mattress?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13825.jpg" +"13826" "Is there direct contact between the mattress and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13826.jpg" +"13827" "Is there direct contact between the egg and tablecloth?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13827.jpg" +"13828" "Is there direct contact between the egg and blueberry?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13828.jpg" +"13829" "Is there direct contact between the beach and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13829.jpg" +"13830" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13830.jpg" +"13831" "Is there direct contact between the ship and river?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13831.jpg" +"13832" "Is there direct contact between the ship and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13832.jpg" +"13833" "Is there direct contact between the book and bookshelf?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13833.jpg" +"13834" "Is there direct contact between the book and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13834.jpg" +"13835" "Is there direct contact between the broccoli and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13835.jpg" +"13836" "Is there direct contact between the melon and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13836.jpg" +"13837" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13837.jpg" +"13838" "Is there direct contact between the cat and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13838.jpg" +"13839" "Is there direct contact between the cat and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13839.jpg" +"13840" "Is there direct contact between the cat and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13840.jpg" +"13841" "Is there direct contact between the lounge and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13841.jpg" +"13842" "Is there direct contact between the chair and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13842.jpg" +"13843" "Is there direct contact between the chair and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13843.jpg" +"13844" "Is there direct contact between the chicken and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13844.jpg" +"13845" "Is there direct contact between the chicken and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13845.jpg" +"13846" "Is there direct contact between the chicken and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13846.jpg" +"13847" "Is there direct contact between the man and bat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13847.jpg" +"13848" "Is there direct contact between the man and woman?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13848.jpg" +"13849" "Is there direct contact between the cow and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13849.jpg" +"13850" "Is there direct contact between the tree and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13850.jpg" +"13851" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13851.jpg" +"13852" "Is there direct contact between the person and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13852.jpg" +"13853" "Is there direct contact between the mouse and mousepad?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13853.jpg" +"13854" "Is there direct contact between the keyboard and mousepad?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13854.jpg" +"13855" "Is there direct contact between the chair and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13855.jpg" +"13856" "Is there direct contact between the toy and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13856.jpg" +"13857" "Is there direct contact between the banana and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13857.jpg" +"13858" "Is there direct contact between the cat and bath?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13858.jpg" +"13859" "Is there direct contact between the bucket and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13859.jpg" +"13860" "Is there direct contact between the dog and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13860.jpg" +"13861" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13861.jpg" +"13862" "Is there direct contact between the plane and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13862.jpg" +"13863" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13863.jpg" +"13864" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13864.jpg" +"13865" "Is there direct contact between the dog and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13865.jpg" +"13866" "Is there direct contact between the toy and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13866.jpg" +"13867" "Is there direct contact between the person and wineglass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13867.jpg" +"13868" "Is there direct contact between the book and blanket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13868.jpg" +"13869" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13869.jpg" +"13870" "Is there direct contact between the woman and phone?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13870.jpg" +"13871" "Is there direct contact between the grass and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13871.jpg" +"13872" "Is there direct contact between the dog and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13872.jpg" +"13873" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13873.jpg" +"13874" "Is there direct contact between the hydrant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13874.jpg" +"13875" "Is there direct contact between the hydrant and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13875.jpg" +"13876" "Is there direct contact between the plane and sky?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13876.jpg" +"13877" "Is there direct contact between the plane and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13877.jpg" +"13878" "Is there direct contact between the cat and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13878.jpg" +"13879" "Is there direct contact between the hat and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13879.jpg" +"13880" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13880.jpg" +"13881" "Is there direct contact between the ship and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13881.jpg" +"13882" "Is there direct contact between the tree and bird?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13882.jpg" +"13883" "Is there direct contact between the dog and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13883.jpg" +"13884" "Is there direct contact between the tie and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13884.jpg" +"13885" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13885.jpg" +"13886" "Is there direct contact between the bird and leave?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13886.jpg" +"13887" "Is there direct contact between the person and skate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13887.jpg" +"13888" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13888.jpg" +"13889" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13889.jpg" +"13890" "Is there direct contact between the sea and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13890.jpg" +"13891" "Is there direct contact between the microwave and cabinet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13891.jpg" +"13892" "Is there direct contact between the microwave and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13892.jpg" +"13893" "Is there direct contact between the flower and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13893.jpg" +"13894" "Is there direct contact between the zebra and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13894.jpg" +"13895" "Is there direct contact between the ship and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13895.jpg" +"13896" "Is there direct contact between the sea and ship?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13896.jpg" +"13897" "Is there direct contact between the phone and notebook?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13897.jpg" +"13898" "Is there direct contact between the orange and bowl?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13898.jpg" +"13899" "Is there direct contact between the orange and plate?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13899.jpg" +"13900" "Is there direct contact between the alarm and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13900.jpg" +"13901" "Is there direct contact between the alarm and quilt?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13901.jpg" +"13902" "Is there direct contact between the elephant and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13902.jpg" +"13903" "Is there direct contact between the elephant and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13903.jpg" +"13904" "Is there direct contact between the woman and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13904.jpg" +"13905" "Is there direct contact between the racket and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13905.jpg" +"13906" "Is there direct contact between the electrombile and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13906.jpg" +"13907" "Is there direct contact between the electrombile and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13907.jpg" +"13908" "Is there direct contact between the man and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13908.jpg" +"13909" "Is there direct contact between the racket and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13909.jpg" +"13910" "Is there direct contact between the lamp and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13910.jpg" +"13911" "Is there direct contact between the drawing and quilt?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13911.jpg" +"13912" "Is there direct contact between the cat and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13912.jpg" +"13913" "Is there direct contact between the woman and kite?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13913.jpg" +"13914" "Is there direct contact between the truck and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13914.jpg" +"13915" "Is there direct contact between the woman and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13915.jpg" +"13916" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13916.jpg" +"13917" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13917.jpg" +"13918" "Is there direct contact between the bus and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13918.jpg" +"13919" "Is there direct contact between the bird and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13919.jpg" +"13920" "Is there direct contact between the bird and river?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13920.jpg" +"13921" "Is there direct contact between the elephant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13921.jpg" +"13922" "Is there direct contact between the tree and elephant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13922.jpg" +"13923" "Is there direct contact between the laptop and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13923.jpg" +"13924" "Is there direct contact between the cup and drawing?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13924.jpg" +"13925" "Is there direct contact between the bear and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13925.jpg" +"13926" "Is there direct contact between the sign and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13926.jpg" +"13927" "Is there direct contact between the road and car?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13927.jpg" +"13928" "Is there direct contact between the flower and vase?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13928.jpg" +"13929" "Is there direct contact between the flower and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13929.jpg" +"13930" "Is there direct contact between the person and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13930.jpg" +"13931" "Is there direct contact between the person and football?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13931.jpg" +"13932" "Is there direct contact between the toilet and can?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13932.jpg" +"13933" "Is there direct contact between the can and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13933.jpg" +"13934" "Is there direct contact between the person and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13934.jpg" +"13935" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13935.jpg" +"13936" "Is there direct contact between the plane and snow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13936.jpg" +"13937" "Is there direct contact between the bird and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13937.jpg" +"13938" "Is there direct contact between the bird and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13938.jpg" +"13939" "Is there direct contact between the bird and hydrant?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13939.jpg" +"13940" "Is there direct contact between the television and cabinet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13940.jpg" +"13941" "Is there direct contact between the table and sofa?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13941.jpg" +"13942" "Is there direct contact between the sunflower and vase?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13942.jpg" +"13943" "Is there direct contact between the sunflower and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13943.jpg" +"13944" "Is there direct contact between the cat and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13944.jpg" +"13945" "Is there direct contact between the cat and tap?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13945.jpg" +"13946" "Is there direct contact between the dog and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13946.jpg" +"13947" "Is there direct contact between the toy and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13947.jpg" +"13948" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13948.jpg" +"13949" "Is there direct contact between the lake and bench?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13949.jpg" +"13950" "Is there direct contact between the mirror and tap?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13950.jpg" +"13951" "Is there direct contact between the tap and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13951.jpg" +"13952" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13952.jpg" +"13953" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13953.jpg" +"13954" "Is there direct contact between the bear and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13954.jpg" +"13955" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13955.jpg" +"13956" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13956.jpg" +"13957" "Is there direct contact between the phone and money?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13957.jpg" +"13958" "Is there direct contact between the phone and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13958.jpg" +"13959" "Is there direct contact between the cat and toilet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13959.jpg" +"13960" "Is there direct contact between the cat and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13960.jpg" +"13961" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13961.jpg" +"13962" "Is there direct contact between the dog and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13962.jpg" +"13963" "Is there direct contact between the cat and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13963.jpg" +"13964" "Is there direct contact between the cat and alarm?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13964.jpg" +"13965" "Is there direct contact between the sign and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13965.jpg" +"13966" "Is there direct contact between the cat and shoe?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13966.jpg" +"13967" "Is there direct contact between the person and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13967.jpg" +"13968" "Is there direct contact between the sailing and island?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13968.jpg" +"13969" "Is there direct contact between the cat and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13969.jpg" +"13970" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13970.jpg" +"13971" "Is there direct contact between the person and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13971.jpg" +"13972" "Is there direct contact between the kite and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13972.jpg" +"13973" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13973.jpg" +"13974" "Is there direct contact between the football and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13974.jpg" +"13975" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13975.jpg" +"13976" "Is there direct contact between the train and bridge?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13976.jpg" +"13977" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13977.jpg" +"13978" "Is there direct contact between the tissue and holder?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13978.jpg" +"13979" "Is there direct contact between the tissue and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13979.jpg" +"13980" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13980.jpg" +"13981" "Is there direct contact between the person and snow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13981.jpg" +"13982" "Is there direct contact between the person and lounge?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13982.jpg" +"13983" "Is there direct contact between the person and umbrella?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13983.jpg" +"13984" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13984.jpg" +"13985" "Is there direct contact between the mouse and mousepad?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13985.jpg" +"13986" "Is there direct contact between the telephone and paper?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13986.jpg" +"13987" "Is there direct contact between the dog and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13987.jpg" +"13988" "Is there direct contact between the person and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13988.jpg" +"13989" "Is there direct contact between the extinguisher and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13989.jpg" +"13990" "Is there direct contact between the extinguisher and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13990.jpg" +"13991" "Is there direct contact between the plane and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13991.jpg" +"13992" "Is there direct contact between the plane and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13992.jpg" +"13993" "Is there direct contact between the tap and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13993.jpg" +"13994" "Is there direct contact between the sink and bath?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13994.jpg" +"13995" "Is there direct contact between the dog and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13995.jpg" +"13996" "Is there direct contact between the dog and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13996.jpg" +"13997" "Is there direct contact between the person and cable?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13997.jpg" +"13998" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13998.jpg" +"13999" "Is there direct contact between the television and cabinet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/13999.jpg" +"14000" "Is there direct contact between the cat and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14000.jpg" +"14001" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14001.jpg" +"14002" "Is there direct contact between the car and bicycle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14002.jpg" +"14003" "Is there direct contact between the computer and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14003.jpg" +"14004" "Is there direct contact between the computer and phone?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14004.jpg" +"14005" "Is there direct contact between the bird and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14005.jpg" +"14006" "Is there direct contact between the sea and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14006.jpg" +"14007" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14007.jpg" +"14008" "Is there direct contact between the bird and apple?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14008.jpg" +"14009" "Is there direct contact between the cat and cabinet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14009.jpg" +"14010" "Is there direct contact between the cat and lamp?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14010.jpg" +"14011" "Is there direct contact between the woman and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14011.jpg" +"14012" "Is there direct contact between the woman and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14012.jpg" +"14013" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14013.jpg" +"14014" "Is there direct contact between the giraffe and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14014.jpg" +"14015" "Is there direct contact between the tree and bench?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14015.jpg" +"14016" "Is there direct contact between the tree and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14016.jpg" +"14017" "Is there direct contact between the dog and skate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14017.jpg" +"14018" "Is there direct contact between the dog and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14018.jpg" +"14019" "Is there direct contact between the plane and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14019.jpg" +"14020" "Is there direct contact between the plane and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14020.jpg" +"14021" "Is there direct contact between the backpack and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14021.jpg" +"14022" "Is there direct contact between the backpack and luggage?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14022.jpg" +"14023" "Is there direct contact between the kite and line?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14023.jpg" +"14024" "Is there direct contact between the kite and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14024.jpg" +"14025" "Is there direct contact between the sign and sky?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14025.jpg" +"14026" "Is there direct contact between the plane and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14026.jpg" +"14027" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14027.jpg" +"14028" "Is there direct contact between the cow and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14028.jpg" +"14029" "Is there direct contact between the car and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14029.jpg" +"14030" "Is there direct contact between the car and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14030.jpg" +"14031" "Is there direct contact between the bear and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14031.jpg" +"14032" "Is there direct contact between the bear and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14032.jpg" +"14033" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14033.jpg" +"14034" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14034.jpg" +"14035" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14035.jpg" +"14036" "Is there direct contact between the person and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14036.jpg" +"14037" "Is there direct contact between the man and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14037.jpg" +"14038" "Is there direct contact between the surfboard and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14038.jpg" +"14039" "Is there direct contact between the phone and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14039.jpg" +"14040" "Is there direct contact between the phone and ebook?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14040.jpg" +"14041" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14041.jpg" +"14042" "Is there direct contact between the person and seegull?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14042.jpg" +"14043" "Is there direct contact between the zebra and tussock?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14043.jpg" +"14044" "Is there direct contact between the cat and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14044.jpg" +"14045" "Is there direct contact between the cat and bicycle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14045.jpg" +"14046" "Is there direct contact between the cat and bed?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14046.jpg" +"14047" "Is there direct contact between the cat and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14047.jpg" +"14048" "Is there direct contact between the lounge and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14048.jpg" +"14049" "Is there direct contact between the lounge and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14049.jpg" +"14050" "Is there direct contact between the man and skate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14050.jpg" +"14051" "Is there direct contact between the man and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14051.jpg" +"14052" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14052.jpg" +"14053" "Is there direct contact between the streetlamp and bench?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14053.jpg" +"14054" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14054.jpg" +"14055" "Is there direct contact between the pole and snow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14055.jpg" +"14056" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14056.jpg" +"14057" "Is there direct contact between the sheep and road?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14057.jpg" +"14058" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14058.jpg" +"14059" "Is there direct contact between the cat and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14059.jpg" +"14060" "Is there direct contact between the keyboard and kettle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14060.jpg" +"14061" "Is there direct contact between the woman and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14061.jpg" +"14062" "Is there direct contact between the banana and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14062.jpg" +"14063" "Is there direct contact between the scoon and tablecloth?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14063.jpg" +"14064" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14064.jpg" +"14065" "Is there direct contact between the person and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14065.jpg" +"14066" "Is there direct contact between the person and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14066.jpg" +"14067" "Is there direct contact between the dog and doll?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14067.jpg" +"14068" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14068.jpg" +"14069" "Is there direct contact between the motorbike and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14069.jpg" +"14070" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14070.jpg" +"14071" "Is there direct contact between the person and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14071.jpg" +"14072" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14072.jpg" +"14073" "Is there direct contact between the surfboard and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14073.jpg" +"14074" "Is there direct contact between the bicycle and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14074.jpg" +"14075" "Is there direct contact between the bicycle and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14075.jpg" +"14076" "Is there direct contact between the truck and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14076.jpg" +"14077" "Is there direct contact between the truck and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14077.jpg" +"14078" "Is there direct contact between the kite and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14078.jpg" +"14079" "Is there direct contact between the toilet and spray?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14079.jpg" +"14080" "Is there direct contact between the bin and tissue?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14080.jpg" +"14081" "Is there direct contact between the book and sofa?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14081.jpg" +"14082" "Is there direct contact between the giraffe and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14082.jpg" +"14083" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14083.jpg" +"14084" "Is there direct contact between the plane and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14084.jpg" +"14085" "Is there direct contact between the cat and shoe?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14085.jpg" +"14086" "Is there direct contact between the cat and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14086.jpg" +"14087" "Is there direct contact between the zebra and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14087.jpg" +"14088" "Is there direct contact between the zebra and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14088.jpg" +"14089" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14089.jpg" +"14090" "Is there direct contact between the cat and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14090.jpg" +"14091" "Is there direct contact between the wall and mirror?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14091.jpg" +"14092" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14092.jpg" +"14093" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14093.jpg" +"14094" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14094.jpg" +"14095" "Is there direct contact between the tree and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14095.jpg" +"14096" "Is there direct contact between the woman and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14096.jpg" +"14097" "Is there direct contact between the woman and football?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14097.jpg" +"14098" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14098.jpg" +"14099" "Is there direct contact between the bus and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14099.jpg" +"14100" "Is there direct contact between the cat and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14100.jpg" +"14101" "Is there direct contact between the dog and cat?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14101.jpg" +"14102" "Is there direct contact between the woman and kite?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14102.jpg" +"14103" "Is there direct contact between the kite and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14103.jpg" +"14104" "Is there direct contact between the cat and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14104.jpg" +"14105" "Is there direct contact between the cat and shoe?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14105.jpg" +"14106" "Is there direct contact between the toilet and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14106.jpg" +"14107" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14107.jpg" +"14108" "Is there direct contact between the man and fence?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14108.jpg" +"14109" "Is there direct contact between the person and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14109.jpg" +"14110" "Is there direct contact between the person and elephant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14110.jpg" +"14111" "Is there direct contact between the monkey and banana?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14111.jpg" +"14112" "Is there direct contact between the hydrant and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14112.jpg" +"14113" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14113.jpg" +"14114" "Is there direct contact between the fence and sheep?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14114.jpg" +"14115" "Is there direct contact between the dog and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14115.jpg" +"14116" "Is there direct contact between the carrot and necklace?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14116.jpg" +"14117" "Is there direct contact between the sign and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14117.jpg" +"14118" "Is there direct contact between the keyboard and mouse?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14118.jpg" +"14119" "Is there direct contact between the table and keyboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14119.jpg" +"14120" "Is there direct contact between the lounge and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14120.jpg" +"14121" "Is there direct contact between the lounge and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14121.jpg" +"14122" "Is there direct contact between the cat and bookshelf?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14122.jpg" +"14123" "Is there direct contact between the man and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14123.jpg" +"14124" "Is there direct contact between the horse and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14124.jpg" +"14125" "Is there direct contact between the sheep and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14125.jpg" +"14126" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14126.jpg" +"14127" "Is there direct contact between the woman and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14127.jpg" +"14128" "Is there direct contact between the bicycle and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14128.jpg" +"14129" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14129.jpg" +"14130" "Is there direct contact between the fence and cow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14130.jpg" +"14131" "Is there direct contact between the paper and tank?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14131.jpg" +"14132" "Is there direct contact between the paper and tap?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14132.jpg" +"14133" "Is there direct contact between the bicycle and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14133.jpg" +"14134" "Is there direct contact between the bicycle and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14134.jpg" +"14135" "Is there direct contact between the house and hydrant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14135.jpg" +"14136" "Is there direct contact between the hydrant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14136.jpg" +"14137" "Is there direct contact between the necklace and dog?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14137.jpg" +"14138" "Is there direct contact between the necklace and skate?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14138.jpg" +"14139" "Is there direct contact between the dog and fence?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14139.jpg" +"14140" "Is there direct contact between the dog and scarf?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14140.jpg" +"14141" "Is there direct contact between the cup and coffee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14141.jpg" +"14142" "Is there direct contact between the coffee and doughnut?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14142.jpg" +"14143" "Is there direct contact between the toothbrush and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14143.jpg" +"14144" "Is there direct contact between the toothbrush and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14144.jpg" +"14145" "Is there direct contact between the dog and pulp?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14145.jpg" +"14146" "Is there direct contact between the dog and paddle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14146.jpg" +"14147" "Is there direct contact between the ground and bus?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14147.jpg" +"14148" "Is there direct contact between the bus and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14148.jpg" +"14149" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14149.jpg" +"14150" "Is there direct contact between the grass and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14150.jpg" +"14151" "Is there direct contact between the forest and bicycle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14151.jpg" +"14152" "Is there direct contact between the grass and bear?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14152.jpg" +"14153" "Is there direct contact between the forest and bear?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14153.jpg" +"14154" "Is there direct contact between the man and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14154.jpg" +"14155" "Is there direct contact between the cup and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14155.jpg" +"14156" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14156.jpg" +"14157" "Is there direct contact between the person and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14157.jpg" +"14158" "Is there direct contact between the woman and phone?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14158.jpg" +"14159" "Is there direct contact between the ground and toilet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14159.jpg" +"14160" "Is there direct contact between the ground and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14160.jpg" +"14161" "Is there direct contact between the bed and pillow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14161.jpg" +"14162" "Is there direct contact between the pillow and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14162.jpg" +"14163" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14163.jpg" +"14164" "Is there direct contact between the cat and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14164.jpg" +"14165" "Is there direct contact between the cat and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14165.jpg" +"14166" "Is there direct contact between the wall and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14166.jpg" +"14167" "Is there direct contact between the bear and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14167.jpg" +"14168" "Is there direct contact between the truck and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14168.jpg" +"14169" "Is there direct contact between the truck and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14169.jpg" +"14170" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14170.jpg" +"14171" "Is there direct contact between the plate and cake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14171.jpg" +"14172" "Is there direct contact between the bench and woman?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14172.jpg" +"14173" "Is there direct contact between the woman and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14173.jpg" +"14174" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14174.jpg" +"14175" "Is there direct contact between the elephant and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14175.jpg" +"14176" "Is there direct contact between the grass and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14176.jpg" +"14177" "Is there direct contact between the doll and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14177.jpg" +"14178" "Is there direct contact between the wall and doll?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14178.jpg" +"14179" "Is there direct contact between the phone and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14179.jpg" +"14180" "Is there direct contact between the truck and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14180.jpg" +"14181" "Is there direct contact between the truck and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14181.jpg" +"14182" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14182.jpg" +"14183" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14183.jpg" +"14184" "Is there direct contact between the kiwifruit and cake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14184.jpg" +"14185" "Is there direct contact between the bench and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14185.jpg" +"14186" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14186.jpg" +"14187" "Is there direct contact between the parasail and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14187.jpg" +"14188" "Is there direct contact between the toothbrush and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14188.jpg" +"14189" "Is there direct contact between the toothbrush and toothpaste?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14189.jpg" +"14190" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14190.jpg" +"14191" "Is there direct contact between the person and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14191.jpg" +"14192" "Is there direct contact between the person and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14192.jpg" +"14193" "Is there direct contact between the person and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14193.jpg" +"14194" "Is there direct contact between the bicycle and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14194.jpg" +"14195" "Is there direct contact between the bicycle and river?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14195.jpg" +"14196" "Is there direct contact between the tissue and holder?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14196.jpg" +"14197" "Is there direct contact between the toilet and cabinet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14197.jpg" +"14198" "Is there direct contact between the lounge and umbrella?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14198.jpg" +"14199" "Is there direct contact between the lounge and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14199.jpg" +"14200" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14200.jpg" +"14201" "Is there direct contact between the person and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14201.jpg" +"14202" "Is there direct contact between the cone and hydrant?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14202.jpg" +"14203" "Is there direct contact between the cat and keyboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14203.jpg" +"14204" "Is there direct contact between the mouse and snack?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14204.jpg" +"14205" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14205.jpg" +"14206" "Is there direct contact between the bus and building?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14206.jpg" +"14207" "Is there direct contact between the computer and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14207.jpg" +"14208" "Is there direct contact between the computer and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14208.jpg" +"14209" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14209.jpg" +"14210" "Is there direct contact between the person and ship?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14210.jpg" +"14211" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14211.jpg" +"14212" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14212.jpg" +"14213" "Is there direct contact between the person and truck?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14213.jpg" +"14214" "Is there direct contact between the truck and motorbike?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14214.jpg" +"14215" "Is there direct contact between the hydrant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14215.jpg" +"14216" "Is there direct contact between the hydrant and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14216.jpg" +"14217" "Is there direct contact between the cat and umbrella?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14217.jpg" +"14218" "Is there direct contact between the bear and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14218.jpg" +"14219" "Is there direct contact between the cat and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14219.jpg" +"14220" "Is there direct contact between the flowerpot and carpet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14220.jpg" +"14221" "Is there direct contact between the reef and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14221.jpg" +"14222" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14222.jpg" +"14223" "Is there direct contact between the person and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14223.jpg" +"14224" "Is there direct contact between the doll and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14224.jpg" +"14225" "Is there direct contact between the doll and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14225.jpg" +"14226" "Is there direct contact between the bus and sand?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14226.jpg" +"14227" "Is there direct contact between the laptop and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14227.jpg" +"14228" "Is there direct contact between the dog and laptop?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14228.jpg" +"14229" "Is there direct contact between the person and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14229.jpg" +"14230" "Is there direct contact between the person and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14230.jpg" +"14231" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14231.jpg" +"14232" "Is there direct contact between the sheep and bird?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14232.jpg" +"14233" "Is there direct contact between the person and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14233.jpg" +"14234" "Is there direct contact between the manhole and car?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14234.jpg" +"14235" "Is there direct contact between the electrombile and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14235.jpg" +"14236" "Is there direct contact between the electrombile and streetlamp?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14236.jpg" +"14237" "Is there direct contact between the cat and shoe?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14237.jpg" +"14238" "Is there direct contact between the person and pillow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14238.jpg" +"14239" "Is there direct contact between the dog and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14239.jpg" +"14240" "Is there direct contact between the pillow and bed?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14240.jpg" +"14241" "Is there direct contact between the lamp and bowl?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14241.jpg" +"14242" "Is there direct contact between the dog and door?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14242.jpg" +"14243" "Is there direct contact between the cat and toilet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14243.jpg" +"14244" "Is there direct contact between the toilet and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14244.jpg" +"14245" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14245.jpg" +"14246" "Is there direct contact between the zebra and antelope?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14246.jpg" +"14247" "Is there direct contact between the woman and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14247.jpg" +"14248" "Is there direct contact between the woman and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14248.jpg" +"14249" "Is there direct contact between the woman and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14249.jpg" +"14250" "Is there direct contact between the surfboard and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14250.jpg" +"14251" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14251.jpg" +"14252" "Is there direct contact between the keyboard and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14252.jpg" +"14253" "Is there direct contact between the keyboard and controller?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14253.jpg" +"14254" "Is there direct contact between the urinal and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14254.jpg" +"14255" "Is there direct contact between the wall and bicycle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14255.jpg" +"14256" "Is there direct contact between the bread and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14256.jpg" +"14257" "Is there direct contact between the bread and water?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14257.jpg" +"14258" "Is there direct contact between the man and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14258.jpg" +"14259" "Is there direct contact between the man and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14259.jpg" +"14260" "Is there direct contact between the road and truck?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14260.jpg" +"14261" "Is there direct contact between the apple and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14261.jpg" +"14262" "Is there direct contact between the apple and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14262.jpg" +"14263" "Is there direct contact between the keyboard and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14263.jpg" +"14264" "Is there direct contact between the mouse and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14264.jpg" +"14265" "Is there direct contact between the toilet and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14265.jpg" +"14266" "Is there direct contact between the bin and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14266.jpg" +"14267" "Is there direct contact between the person and lounge?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14267.jpg" +"14268" "Is there direct contact between the dog and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14268.jpg" +"14269" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14269.jpg" +"14270" "Is there direct contact between the rail and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14270.jpg" +"14271" "Is there direct contact between the bottle and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14271.jpg" +"14272" "Is there direct contact between the bottle and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14272.jpg" +"14273" "Is there direct contact between the person and camera?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14273.jpg" +"14274" "Is there direct contact between the camera and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14274.jpg" +"14275" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14275.jpg" +"14276" "Is there direct contact between the frisbee and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14276.jpg" +"14277" "Is there direct contact between the woman and banana?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14277.jpg" +"14278" "Is there direct contact between the woman and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14278.jpg" +"14279" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14279.jpg" +"14280" "Is there direct contact between the lounge and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14280.jpg" +"14281" "Is there direct contact between the umbrella and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14281.jpg" +"14282" "Is there direct contact between the cat and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14282.jpg" +"14283" "Is there direct contact between the cat and tap?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14283.jpg" +"14284" "Is there direct contact between the keyboard and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14284.jpg" +"14285" "Is there direct contact between the hydrant and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14285.jpg" +"14286" "Is there direct contact between the kettle and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14286.jpg" +"14287" "Is there direct contact between the kettle and flower?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14287.jpg" +"14288" "Is there direct contact between the cat and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14288.jpg" +"14289" "Is there direct contact between the cat and electrombile?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14289.jpg" +"14290" "Is there direct contact between the orange and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14290.jpg" +"14291" "Is there direct contact between the orange and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14291.jpg" +"14292" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14292.jpg" +"14293" "Is there direct contact between the sheep and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14293.jpg" +"14294" "Is there direct contact between the tap and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14294.jpg" +"14295" "Is there direct contact between the tap and light?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14295.jpg" +"14296" "Is there direct contact between the tree and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14296.jpg" +"14297" "Is there direct contact between the bench and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14297.jpg" +"14298" "Is there direct contact between the cat and toilet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14298.jpg" +"14299" "Is there direct contact between the cat and brush?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14299.jpg" +"14300" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14300.jpg" +"14301" "Is there direct contact between the car and building?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14301.jpg" +"14302" "Is there direct contact between the pigeon and telescope?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14302.jpg" +"14303" "Is there direct contact between the pigeon and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14303.jpg" +"14304" "Is there direct contact between the motorbike and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14304.jpg" +"14305" "Is there direct contact between the motorbike and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14305.jpg" +"14306" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14306.jpg" +"14307" "Is there direct contact between the bus and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14307.jpg" +"14308" "Is there direct contact between the tissue and holder?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14308.jpg" +"14309" "Is there direct contact between the bin and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14309.jpg" +"14310" "Is there direct contact between the vase and flower?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14310.jpg" +"14311" "Is there direct contact between the light and mirror?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14311.jpg" +"14312" "Is there direct contact between the pizza and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14312.jpg" +"14313" "Is there direct contact between the pizza and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14313.jpg" +"14314" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14314.jpg" +"14315" "Is there direct contact between the giraffe and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14315.jpg" +"14316" "Is there direct contact between the apple and knife?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14316.jpg" +"14317" "Is there direct contact between the knife and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14317.jpg" +"14318" "Is there direct contact between the hot and grill?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14318.jpg" +"14319" "Is there direct contact between the hot and charcoal?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14319.jpg" +"14320" "Is there direct contact between the pigeon and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14320.jpg" +"14321" "Is there direct contact between the table and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14321.jpg" +"14322" "Is there direct contact between the laptop and computer?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14322.jpg" +"14323" "Is there direct contact between the table and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14323.jpg" +"14324" "Is there direct contact between the laptop and wine?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14324.jpg" +"14325" "Is there direct contact between the boy and bat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14325.jpg" +"14326" "Is there direct contact between the boy and man?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14326.jpg" +"14327" "Is there direct contact between the grass and ball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14327.jpg" +"14328" "Is there direct contact between the man and woman?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14328.jpg" +"14329" "Is there direct contact between the dog and electrombile?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14329.jpg" +"14330" "Is there direct contact between the dog and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14330.jpg" +"14331" "Is there direct contact between the cake and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14331.jpg" +"14332" "Is there direct contact between the doughnut and box?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14332.jpg" +"14333" "Is there direct contact between the doughnut and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14333.jpg" +"14334" "Is there direct contact between the dog and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14334.jpg" +"14335" "Is there direct contact between the toy and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14335.jpg" +"14336" "Is there direct contact between the boy and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14336.jpg" +"14337" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14337.jpg" +"14338" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14338.jpg" +"14339" "Is there direct contact between the sign and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14339.jpg" +"14340" "Is there direct contact between the bus and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14340.jpg" +"14341" "Is there direct contact between the bus and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14341.jpg" +"14342" "Is there direct contact between the dog and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14342.jpg" +"14343" "Is there direct contact between the dog and bench?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14343.jpg" +"14344" "Is there direct contact between the bicycle and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14344.jpg" +"14345" "Is there direct contact between the bicycle and hydrant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14345.jpg" +"14346" "Is there direct contact between the cat and luggage?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14346.jpg" +"14347" "Is there direct contact between the cat and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14347.jpg" +"14348" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14348.jpg" +"14349" "Is there direct contact between the person and bus?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14349.jpg" +"14350" "Is there direct contact between the person and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14350.jpg" +"14351" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14351.jpg" +"14352" "Is there direct contact between the sheep and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14352.jpg" +"14353" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14353.jpg" +"14354" "Is there direct contact between the person and horse?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14354.jpg" +"14355" "Is there direct contact between the refrigerator and cabinet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14355.jpg" +"14356" "Is there direct contact between the refrigerator and microwave?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14356.jpg" +"14357" "Is there direct contact between the bag and bag?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14357.jpg" +"14358" "Is there direct contact between the tomato and carrot?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14358.jpg" +"14359" "Is there direct contact between the broccoli and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14359.jpg" +"14360" "Is there direct contact between the tree and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14360.jpg" +"14361" "Is there direct contact between the grass and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14361.jpg" +"14362" "Is there direct contact between the notebook and support?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14362.jpg" +"14363" "Is there direct contact between the keyboard and mouse?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14363.jpg" +"14364" "Is there direct contact between the horse and saddle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14364.jpg" +"14365" "Is there direct contact between the saddle and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14365.jpg" +"14366" "Is there direct contact between the pillow and quilt?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14366.jpg" +"14367" "Is there direct contact between the pillow and drawing?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14367.jpg" +"14368" "Is there direct contact between the apple and orange?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14368.jpg" +"14369" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14369.jpg" +"14370" "Is there direct contact between the bench and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14370.jpg" +"14371" "Is there direct contact between the banana and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14371.jpg" +"14372" "Is there direct contact between the pillow and quilt?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14372.jpg" +"14373" "Is there direct contact between the pillow and lamp?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14373.jpg" +"14374" "Is there direct contact between the snowboard and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14374.jpg" +"14375" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14375.jpg" +"14376" "Is there direct contact between the grass and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14376.jpg" +"14377" "Is there direct contact between the tree and bench?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14377.jpg" +"14378" "Is there direct contact between the train and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14378.jpg" +"14379" "Is there direct contact between the train and board?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14379.jpg" +"14380" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14380.jpg" +"14381" "Is there direct contact between the train and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14381.jpg" +"14382" "Is there direct contact between the baggage and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14382.jpg" +"14383" "Is there direct contact between the cone and hydrant?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14383.jpg" +"14384" "Is there direct contact between the bicycle and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14384.jpg" +"14385" "Is there direct contact between the bicycle and zebra?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14385.jpg" +"14386" "Is there direct contact between the cherry and orange?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14386.jpg" +"14387" "Is there direct contact between the cherry and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14387.jpg" +"14388" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14388.jpg" +"14389" "Is there direct contact between the bench and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14389.jpg" +"14390" "Is there direct contact between the rice and box?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14390.jpg" +"14391" "Is there direct contact between the rice and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14391.jpg" +"14392" "Is there direct contact between the bus and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14392.jpg" +"14393" "Is there direct contact between the bus and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14393.jpg" +"14394" "Is there direct contact between the bus and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14394.jpg" +"14395" "Is there direct contact between the bus and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14395.jpg" +"14396" "Is there direct contact between the dog and skate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14396.jpg" +"14397" "Is there direct contact between the dog and sofa?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14397.jpg" +"14398" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14398.jpg" +"14399" "Is there direct contact between the ship and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14399.jpg" +"14400" "Is there direct contact between the banana and tangerine?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14400.jpg" +"14401" "Is there direct contact between the pear and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14401.jpg" +"14402" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14402.jpg" +"14403" "Is there direct contact between the giraffe and bush?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14403.jpg" +"14404" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14404.jpg" +"14405" "Is there direct contact between the sea and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14405.jpg" +"14406" "Is there direct contact between the sea and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14406.jpg" +"14407" "Is there direct contact between the sofa and woman?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14407.jpg" +"14408" "Is there direct contact between the woman and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14408.jpg" +"14409" "Is there direct contact between the sea and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14409.jpg" +"14410" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14410.jpg" +"14411" "Is there direct contact between the floor and computer?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14411.jpg" +"14412" "Is there direct contact between the floor and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14412.jpg" +"14413" "Is there direct contact between the keyboard and bread?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14413.jpg" +"14414" "Is there direct contact between the plate and bread?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14414.jpg" +"14415" "Is there direct contact between the ground and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14415.jpg" +"14416" "Is there direct contact between the car and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14416.jpg" +"14417" "Is there direct contact between the motorbike and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14417.jpg" +"14418" "Is there direct contact between the motorbike and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14418.jpg" +"14419" "Is there direct contact between the pole and sign?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14419.jpg" +"14420" "Is there direct contact between the man and frisbee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14420.jpg" +"14421" "Is there direct contact between the man and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14421.jpg" +"14422" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14422.jpg" +"14423" "Is there direct contact between the cow and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14423.jpg" +"14424" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14424.jpg" +"14425" "Is there direct contact between the tree and sign?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14425.jpg" +"14426" "Is there direct contact between the tap and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14426.jpg" +"14427" "Is there direct contact between the tap and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14427.jpg" +"14428" "Is there direct contact between the pizza and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14428.jpg" +"14429" "Is there direct contact between the pizza and fork?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14429.jpg" +"14430" "Is there direct contact between the child and ball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14430.jpg" +"14431" "Is there direct contact between the man and child?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14431.jpg" +"14432" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14432.jpg" +"14433" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14433.jpg" +"14434" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14434.jpg" +"14435" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14435.jpg" +"14436" "Is there direct contact between the woman and sofa?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14436.jpg" +"14437" "Is there direct contact between the sofa and notebook?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14437.jpg" +"14438" "Is there direct contact between the banana and scoon?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14438.jpg" +"14439" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14439.jpg" +"14440" "Is there direct contact between the giraffe and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14440.jpg" +"14441" "Is there direct contact between the child and umbrella?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14441.jpg" +"14442" "Is there direct contact between the umbrella and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14442.jpg" +"14443" "Is there direct contact between the person and kite?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14443.jpg" +"14444" "Is there direct contact between the child and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14444.jpg" +"14445" "Is there direct contact between the child and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14445.jpg" +"14446" "Is there direct contact between the banana and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14446.jpg" +"14447" "Is there direct contact between the knife and tablecloth?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14447.jpg" +"14448" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14448.jpg" +"14449" "Is there direct contact between the dog and doghole?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14449.jpg" +"14450" "Is there direct contact between the dog and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14450.jpg" +"14451" "Is there direct contact between the bread and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14451.jpg" +"14452" "Is there direct contact between the car and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14452.jpg" +"14453" "Is there direct contact between the horse and road?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14453.jpg" +"14454" "Is there direct contact between the duck and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14454.jpg" +"14455" "Is there direct contact between the plane and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14455.jpg" +"14456" "Is there direct contact between the pot and cooktop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14456.jpg" +"14457" "Is there direct contact between the microwave and pot?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14457.jpg" +"14458" "Is there direct contact between the flower and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14458.jpg" +"14459" "Is there direct contact between the house and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14459.jpg" +"14460" "Is there direct contact between the cat and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14460.jpg" +"14461" "Is there direct contact between the cat and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14461.jpg" +"14462" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14462.jpg" +"14463" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14463.jpg" +"14464" "Is there direct contact between the person and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14464.jpg" +"14465" "Is there direct contact between the person and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14465.jpg" +"14466" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14466.jpg" +"14467" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14467.jpg" +"14468" "Is there direct contact between the kite and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14468.jpg" +"14469" "Is there direct contact between the bird and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14469.jpg" +"14470" "Is there direct contact between the bird and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14470.jpg" +"14471" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14471.jpg" +"14472" "Is there direct contact between the forest and plane?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14472.jpg" +"14473" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14473.jpg" +"14474" "Is there direct contact between the cloud and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14474.jpg" +"14475" "Is there direct contact between the person and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14475.jpg" +"14476" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14476.jpg" +"14477" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14477.jpg" +"14478" "Is there direct contact between the grass and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14478.jpg" +"14479" "Is there direct contact between the frisbee and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14479.jpg" +"14480" "Is there direct contact between the bear and river?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14480.jpg" +"14481" "Is there direct contact between the forest and river?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14481.jpg" +"14482" "Is there direct contact between the toy and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14482.jpg" +"14483" "Is there direct contact between the toy and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14483.jpg" +"14484" "Is there direct contact between the skate and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14484.jpg" +"14485" "Is there direct contact between the dog and skate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14485.jpg" +"14486" "Is there direct contact between the toilet and bin?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14486.jpg" +"14487" "Is there direct contact between the floor and toilet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14487.jpg" +"14488" "Is there direct contact between the cloud and kite?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14488.jpg" +"14489" "Is there direct contact between the laptop and sofa?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14489.jpg" +"14490" "Is there direct contact between the woman and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14490.jpg" +"14491" "Is there direct contact between the frisbee and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14491.jpg" +"14492" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14492.jpg" +"14493" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14493.jpg" +"14494" "Is there direct contact between the tangerine and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14494.jpg" +"14495" "Is there direct contact between the chicken and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14495.jpg" +"14496" "Is there direct contact between the chicken and fence?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14496.jpg" +"14497" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14497.jpg" +"14498" "Is there direct contact between the person and snow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14498.jpg" +"14499" "Is there direct contact between the person and umbrella?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14499.jpg" +"14500" "Is there direct contact between the umbrella and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14500.jpg" +"14501" "Is there direct contact between the duck and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14501.jpg" +"14502" "Is there direct contact between the duck and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14502.jpg" +"14503" "Is there direct contact between the person and pulp?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14503.jpg" +"14504" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14504.jpg" +"14505" "Is there direct contact between the giraffe and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14505.jpg" +"14506" "Is there direct contact between the banana and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14506.jpg" +"14507" "Is there direct contact between the doll and banana?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14507.jpg" +"14508" "Is there direct contact between the woman and pole?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14508.jpg" +"14509" "Is there direct contact between the plate and banana?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14509.jpg" +"14510" "Is there direct contact between the banana and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14510.jpg" +"14511" "Is there direct contact between the bowl and scoon?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14511.jpg" +"14512" "Is there direct contact between the scoon and egg?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14512.jpg" +"14513" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14513.jpg" +"14514" "Is there direct contact between the person and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14514.jpg" +"14515" "Is there direct contact between the tennis and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14515.jpg" +"14516" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14516.jpg" +"14517" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14517.jpg" +"14518" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14518.jpg" +"14519" "Is there direct contact between the car and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14519.jpg" +"14520" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14520.jpg" +"14521" "Is there direct contact between the sign and wire?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14521.jpg" +"14522" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14522.jpg" +"14523" "Is there direct contact between the truck and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14523.jpg" +"14524" "Is there direct contact between the cushion and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14524.jpg" +"14525" "Is there direct contact between the tissue and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14525.jpg" +"14526" "Is there direct contact between the bear and river?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14526.jpg" +"14527" "Is there direct contact between the bear and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14527.jpg" +"14528" "Is there direct contact between the horse and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14528.jpg" +"14529" "Is there direct contact between the horse and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14529.jpg" +"14530" "Is there direct contact between the motorbike and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14530.jpg" +"14531" "Is there direct contact between the dog and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14531.jpg" +"14532" "Is there direct contact between the board and knife?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14532.jpg" +"14533" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14533.jpg" +"14534" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14534.jpg" +"14535" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14535.jpg" +"14536" "Is there direct contact between the banana and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14536.jpg" +"14537" "Is there direct contact between the apple and lemon?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14537.jpg" +"14538" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14538.jpg" +"14539" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14539.jpg" +"14540" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14540.jpg" +"14541" "Is there direct contact between the bird and pizza?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14541.jpg" +"14542" "Is there direct contact between the phone and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14542.jpg" +"14543" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14543.jpg" +"14544" "Is there direct contact between the giraffe and lion?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14544.jpg" +"14545" "Is there direct contact between the person and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14545.jpg" +"14546" "Is there direct contact between the racket and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14546.jpg" +"14547" "Is there direct contact between the dog and frisbee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14547.jpg" +"14548" "Is there direct contact between the frisbee and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14548.jpg" +"14549" "Is there direct contact between the person and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14549.jpg" +"14550" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14550.jpg" +"14551" "Is there direct contact between the bread and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14551.jpg" +"14552" "Is there direct contact between the umbrella and lounge?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14552.jpg" +"14553" "Is there direct contact between the umbrella and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14553.jpg" +"14554" "Is there direct contact between the apple and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14554.jpg" +"14555" "Is there direct contact between the pear and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14555.jpg" +"14556" "Is there direct contact between the fork and bread?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14556.jpg" +"14557" "Is there direct contact between the train and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14557.jpg" +"14558" "Is there direct contact between the grass and train?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14558.jpg" +"14559" "Is there direct contact between the giraffe and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14559.jpg" +"14560" "Is there direct contact between the plane and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14560.jpg" +"14561" "Is there direct contact between the person and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14561.jpg" +"14562" "Is there direct contact between the racket and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14562.jpg" +"14563" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14563.jpg" +"14564" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14564.jpg" +"14565" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14565.jpg" +"14566" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14566.jpg" +"14567" "Is there direct contact between the laptop and support?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14567.jpg" +"14568" "Is there direct contact between the keyboard and card?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14568.jpg" +"14569" "Is there direct contact between the tree and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14569.jpg" +"14570" "Is there direct contact between the sea and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14570.jpg" +"14571" "Is there direct contact between the knife and orange?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14571.jpg" +"14572" "Is there direct contact between the forest and sign?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14572.jpg" +"14573" "Is there direct contact between the person and baseball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14573.jpg" +"14574" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14574.jpg" +"14575" "Is there direct contact between the person and baseball?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14575.jpg" +"14576" "Is there direct contact between the cat and dog?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14576.jpg" +"14577" "Is there direct contact between the dog and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14577.jpg" +"14578" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14578.jpg" +"14579" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14579.jpg" +"14580" "Is there direct contact between the ship and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14580.jpg" +"14581" "Is there direct contact between the ship and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14581.jpg" +"14582" "Is there direct contact between the mouse and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14582.jpg" +"14583" "Is there direct contact between the monitor and keyboard?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14583.jpg" +"14584" "Is there direct contact between the dog and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14584.jpg" +"14585" "Is there direct contact between the dog and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14585.jpg" +"14586" "Is there direct contact between the person and snowboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14586.jpg" +"14587" "Is there direct contact between the person and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14587.jpg" +"14588" "Is there direct contact between the bath and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14588.jpg" +"14589" "Is there direct contact between the bath and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14589.jpg" +"14590" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14590.jpg" +"14591" "Is there direct contact between the person and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14591.jpg" +"14592" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14592.jpg" +"14593" "Is there direct contact between the dog and frisbee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14593.jpg" +"14594" "Is there direct contact between the frisbee and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14594.jpg" +"14595" "Is there direct contact between the bear and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14595.jpg" +"14596" "Is there direct contact between the house and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14596.jpg" +"14597" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14597.jpg" +"14598" "Is there direct contact between the bench and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14598.jpg" +"14599" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14599.jpg" +"14600" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14600.jpg" +"14601" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14601.jpg" +"14602" "Is there direct contact between the bench and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14602.jpg" +"14603" "Is there direct contact between the truck and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14603.jpg" +"14604" "Is there direct contact between the truck and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14604.jpg" +"14605" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14605.jpg" +"14606" "Is there direct contact between the person and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14606.jpg" +"14607" "Is there direct contact between the apple and banana?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14607.jpg" +"14608" "Is there direct contact between the toy and banana?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14608.jpg" +"14609" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14609.jpg" +"14610" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14610.jpg" +"14611" "Is there direct contact between the dog and frisbee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14611.jpg" +"14612" "Is there direct contact between the frisbee and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14612.jpg" +"14613" "Is there direct contact between the person and skate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14613.jpg" +"14614" "Is there direct contact between the motorbike and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14614.jpg" +"14615" "Is there direct contact between the motorbike and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14615.jpg" +"14616" "Is there direct contact between the pulp and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14616.jpg" +"14617" "Is there direct contact between the pulp and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14617.jpg" +"14618" "Is there direct contact between the doll and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14618.jpg" +"14619" "Is there direct contact between the doll and door?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14619.jpg" +"14620" "Is there direct contact between the table and mouse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14620.jpg" +"14621" "Is there direct contact between the mouse and apple?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14621.jpg" +"14622" "Is there direct contact between the mirror and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14622.jpg" +"14623" "Is there direct contact between the mirror and toothbrush?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14623.jpg" +"14624" "Is there direct contact between the doll and controller?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14624.jpg" +"14625" "Is there direct contact between the doll and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14625.jpg" +"14626" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14626.jpg" +"14627" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14627.jpg" +"14628" "Is there direct contact between the cat and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14628.jpg" +"14629" "Is there direct contact between the cat and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14629.jpg" +"14630" "Is there direct contact between the keyboard and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14630.jpg" +"14631" "Is there direct contact between the keyboard and notebook?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14631.jpg" +"14632" "Is there direct contact between the tangerine and apple?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14632.jpg" +"14633" "Is there direct contact between the apple and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14633.jpg" +"14634" "Is there direct contact between the duck and river?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14634.jpg" +"14635" "Is there direct contact between the duck and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14635.jpg" +"14636" "Is there direct contact between the dog and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14636.jpg" +"14637" "Is there direct contact between the motorbike and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14637.jpg" +"14638" "Is there direct contact between the motorbike and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14638.jpg" +"14639" "Is there direct contact between the cat and shoe?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14639.jpg" +"14640" "Is there direct contact between the cat and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14640.jpg" +"14641" "Is there direct contact between the cat and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14641.jpg" +"14642" "Is there direct contact between the cat and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14642.jpg" +"14643" "Is there direct contact between the bread and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14643.jpg" +"14644" "Is there direct contact between the person and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14644.jpg" +"14645" "Is there direct contact between the racket and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14645.jpg" +"14646" "Is there direct contact between the banana and tangerine?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14646.jpg" +"14647" "Is there direct contact between the banana and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14647.jpg" +"14648" "Is there direct contact between the banana and paper?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14648.jpg" +"14649" "Is there direct contact between the banana and pen?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14649.jpg" +"14650" "Is there direct contact between the dog and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14650.jpg" +"14651" "Is there direct contact between the motorbike and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14651.jpg" +"14652" "Is there direct contact between the motorbike and river?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14652.jpg" +"14653" "Is there direct contact between the keyboard and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14653.jpg" +"14654" "Is there direct contact between the keyboard and mouse?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14654.jpg" +"14655" "Is there direct contact between the elephant and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14655.jpg" +"14656" "Is there direct contact between the elephant and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14656.jpg" +"14657" "Is there direct contact between the bird and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14657.jpg" +"14658" "Is there direct contact between the bird and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14658.jpg" +"14659" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14659.jpg" +"14660" "Is there direct contact between the cat and controller?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14660.jpg" +"14661" "Is there direct contact between the microwave and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14661.jpg" +"14662" "Is there direct contact between the microwave and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14662.jpg" +"14663" "Is there direct contact between the giraffe and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14663.jpg" +"14664" "Is there direct contact between the dog and blanket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14664.jpg" +"14665" "Is there direct contact between the person and dog?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14665.jpg" +"14666" "Is there direct contact between the dog and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14666.jpg" +"14667" "Is there direct contact between the person and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14667.jpg" +"14668" "Is there direct contact between the person and bus?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14668.jpg" +"14669" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14669.jpg" +"14670" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14670.jpg" +"14671" "Is there direct contact between the signal and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14671.jpg" +"14672" "Is there direct contact between the signal and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14672.jpg" +"14673" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14673.jpg" +"14674" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14674.jpg" +"14675" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14675.jpg" +"14676" "Is there direct contact between the person and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14676.jpg" +"14677" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14677.jpg" +"14678" "Is there direct contact between the person and rail?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14678.jpg" +"14679" "Is there direct contact between the hydrant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14679.jpg" +"14680" "Is there direct contact between the hydrant and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14680.jpg" +"14681" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14681.jpg" +"14682" "Is there direct contact between the mountain and sign?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14682.jpg" +"14683" "Is there direct contact between the orange and bowl?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14683.jpg" +"14684" "Is there direct contact between the orange and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14684.jpg" +"14685" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14685.jpg" +"14686" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14686.jpg" +"14687" "Is there direct contact between the train and river?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14687.jpg" +"14688" "Is there direct contact between the person and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14688.jpg" +"14689" "Is there direct contact between the umbrella and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14689.jpg" +"14690" "Is there direct contact between the bench and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14690.jpg" +"14691" "Is there direct contact between the sea and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14691.jpg" +"14692" "Is there direct contact between the dog and controller?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14692.jpg" +"14693" "Is there direct contact between the controller and blanket?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14693.jpg" +"14694" "Is there direct contact between the bird and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14694.jpg" +"14695" "Is there direct contact between the bird and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14695.jpg" +"14696" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14696.jpg" +"14697" "Is there direct contact between the person and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14697.jpg" +"14698" "Is there direct contact between the umbrella and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14698.jpg" +"14699" "Is there direct contact between the umbrella and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14699.jpg" +"14700" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14700.jpg" +"14701" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14701.jpg" +"14702" "Is there direct contact between the sheep and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14702.jpg" +"14703" "Is there direct contact between the sheep and fence?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14703.jpg" +"14704" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14704.jpg" +"14705" "Is there direct contact between the bench and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14705.jpg" +"14706" "Is there direct contact between the broccoli and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14706.jpg" +"14707" "Is there direct contact between the shrimp and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14707.jpg" +"14708" "Is there direct contact between the sign and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14708.jpg" +"14709" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14709.jpg" +"14710" "Is there direct contact between the sea and surfboard?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14710.jpg" +"14711" "Is there direct contact between the cup and juice?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14711.jpg" +"14712" "Is there direct contact between the wall and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14712.jpg" +"14713" "Is there direct contact between the racket and tennis?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14713.jpg" +"14714" "Is there direct contact between the tennis and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14714.jpg" +"14715" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14715.jpg" +"14716" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14716.jpg" +"14717" "Is there direct contact between the dog and toilet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14717.jpg" +"14718" "Is there direct contact between the dog and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14718.jpg" +"14719" "Is there direct contact between the tree and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14719.jpg" +"14720" "Is there direct contact between the sign and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14720.jpg" +"14721" "Is there direct contact between the horse and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14721.jpg" +"14722" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14722.jpg" +"14723" "Is there direct contact between the person and keyboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14723.jpg" +"14724" "Is there direct contact between the keyboard and book?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14724.jpg" +"14725" "Is there direct contact between the dog and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14725.jpg" +"14726" "Is there direct contact between the dog and car?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14726.jpg" +"14727" "Is there direct contact between the giraffe and sky?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14727.jpg" +"14728" "Is there direct contact between the bath and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14728.jpg" +"14729" "Is there direct contact between the toilet and window?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14729.jpg" +"14730" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14730.jpg" +"14731" "Is there direct contact between the tree and giraffe?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14731.jpg" +"14732" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14732.jpg" +"14733" "Is there direct contact between the person and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14733.jpg" +"14734" "Is there direct contact between the sink and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14734.jpg" +"14735" "Is there direct contact between the sink and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14735.jpg" +"14736" "Is there direct contact between the dog and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14736.jpg" +"14737" "Is there direct contact between the dog and tennis?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14737.jpg" +"14738" "Is there direct contact between the lemon and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14738.jpg" +"14739" "Is there direct contact between the grapefruit and lemon?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14739.jpg" +"14740" "Is there direct contact between the person and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14740.jpg" +"14741" "Is there direct contact between the racket and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14741.jpg" +"14742" "Is there direct contact between the door and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14742.jpg" +"14743" "Is there direct contact between the door and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14743.jpg" +"14744" "Is there direct contact between the banana and tangerine?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14744.jpg" +"14745" "Is there direct contact between the person and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14745.jpg" +"14746" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14746.jpg" +"14747" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14747.jpg" +"14748" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14748.jpg" +"14749" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14749.jpg" +"14750" "Is there direct contact between the cat and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14750.jpg" +"14751" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14751.jpg" +"14752" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14752.jpg" +"14753" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14753.jpg" +"14754" "Is there direct contact between the truck and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14754.jpg" +"14755" "Is there direct contact between the table and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14755.jpg" +"14756" "Is there direct contact between the cup and keyboard?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14756.jpg" +"14757" "Is there direct contact between the carrot and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14757.jpg" +"14758" "Is there direct contact between the carrot and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14758.jpg" +"14759" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14759.jpg" +"14760" "Is there direct contact between the dog and frisbee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14760.jpg" +"14761" "Is there direct contact between the frisbee and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14761.jpg" +"14762" "Is there direct contact between the child and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14762.jpg" +"14763" "Is there direct contact between the child and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14763.jpg" +"14764" "Is there direct contact between the plane and sky?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14764.jpg" +"14765" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14765.jpg" +"14766" "Is there direct contact between the sea and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14766.jpg" +"14767" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14767.jpg" +"14768" "Is there direct contact between the sea and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14768.jpg" +"14769" "Is there direct contact between the giraffe and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14769.jpg" +"14770" "Is there direct contact between the cat and sink?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14770.jpg" +"14771" "Is there direct contact between the cat and tap?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14771.jpg" +"14772" "Is there direct contact between the dog and carpet?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14772.jpg" +"14773" "Is there direct contact between the dog and mirror?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14773.jpg" +"14774" "Is there direct contact between the cat and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14774.jpg" +"14775" "Is there direct contact between the broccoli and tomato?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14775.jpg" +"14776" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14776.jpg" +"14777" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14777.jpg" +"14778" "Is there direct contact between the banana and tangerine?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14778.jpg" +"14779" "Is there direct contact between the fence and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14779.jpg" +"14780" "Is there direct contact between the fence and hydrant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14780.jpg" +"14781" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14781.jpg" +"14782" "Is there direct contact between the floor and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14782.jpg" +"14783" "Is there direct contact between the woman and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14783.jpg" +"14784" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14784.jpg" +"14785" "Is there direct contact between the dog and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14785.jpg" +"14786" "Is there direct contact between the duck and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14786.jpg" +"14787" "Is there direct contact between the duck and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14787.jpg" +"14788" "Is there direct contact between the dog and bottle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14788.jpg" +"14789" "Is there direct contact between the bottle and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14789.jpg" +"14790" "Is there direct contact between the elephant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14790.jpg" +"14791" "Is there direct contact between the elephant and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14791.jpg" +"14792" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14792.jpg" +"14793" "Is there direct contact between the man and racket?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14793.jpg" +"14794" "Is there direct contact between the racket and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14794.jpg" +"14795" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14795.jpg" +"14796" "Is there direct contact between the refrigerator and wall?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14796.jpg" +"14797" "Is there direct contact between the refrigerator and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14797.jpg" +"14798" "Is there direct contact between the umbrella and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14798.jpg" +"14799" "Is there direct contact between the lounge and umbrella?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14799.jpg" +"14800" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14800.jpg" +"14801" "Is there direct contact between the ground and bench?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14801.jpg" +"14802" "Is there direct contact between the man and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14802.jpg" +"14803" "Is there direct contact between the man and plane?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14803.jpg" +"14804" "Is there direct contact between the giraffe and bird?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14804.jpg" +"14805" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14805.jpg" +"14806" "Is there direct contact between the dog and frisbee?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14806.jpg" +"14807" "Is there direct contact between the frisbee and football?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14807.jpg" +"14808" "Is there direct contact between the man and kite?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14808.jpg" +"14809" "Is there direct contact between the kite and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14809.jpg" +"14810" "Is there direct contact between the refrigerator and window?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14810.jpg" +"14811" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14811.jpg" +"14812" "Is there direct contact between the dog and person?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14812.jpg" +"14813" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14813.jpg" +"14814" "Is there direct contact between the cow and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14814.jpg" +"14815" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14815.jpg" +"14816" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14816.jpg" +"14817" "Is there direct contact between the person and horse?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14817.jpg" +"14818" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14818.jpg" +"14819" "Is there direct contact between the person and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14819.jpg" +"14820" "Is there direct contact between the elephant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14820.jpg" +"14821" "Is there direct contact between the tap and showerpuff?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14821.jpg" +"14822" "Is there direct contact between the tap and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14822.jpg" +"14823" "Is there direct contact between the person and kite?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14823.jpg" +"14824" "Is there direct contact between the child and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14824.jpg" +"14825" "Is there direct contact between the child and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14825.jpg" +"14826" "Is there direct contact between the grass and cow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14826.jpg" +"14827" "Is there direct contact between the horse and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14827.jpg" +"14828" "Is there direct contact between the horse and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14828.jpg" +"14829" "Is there direct contact between the dog and umbrella?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14829.jpg" +"14830" "Is there direct contact between the man and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14830.jpg" +"14831" "Is there direct contact between the man and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14831.jpg" +"14832" "Is there direct contact between the bird and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14832.jpg" +"14833" "Is there direct contact between the bird and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14833.jpg" +"14834" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14834.jpg" +"14835" "Is there direct contact between the bird and core?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14835.jpg" +"14836" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14836.jpg" +"14837" "Is there direct contact between the bench and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14837.jpg" +"14838" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14838.jpg" +"14839" "Is there direct contact between the giraffe and man?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14839.jpg" +"14840" "Is there direct contact between the horse and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14840.jpg" +"14841" "Is there direct contact between the ship and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14841.jpg" +"14842" "Is there direct contact between the ship and sun?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14842.jpg" +"14843" "Is there direct contact between the umbrella and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14843.jpg" +"14844" "Is there direct contact between the umbrella and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14844.jpg" +"14845" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14845.jpg" +"14846" "Is there direct contact between the giraffe and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14846.jpg" +"14847" "Is there direct contact between the cake and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14847.jpg" +"14848" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14848.jpg" +"14849" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14849.jpg" +"14850" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14850.jpg" +"14851" "Is there direct contact between the panda and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14851.jpg" +"14852" "Is there direct contact between the lemon and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14852.jpg" +"14853" "Is there direct contact between the lemon and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14853.jpg" +"14854" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14854.jpg" +"14855" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14855.jpg" +"14856" "Is there direct contact between the lake and goose?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14856.jpg" +"14857" "Is there direct contact between the pizza and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14857.jpg" +"14858" "Is there direct contact between the microwave and book?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14858.jpg" +"14859" "Is there direct contact between the bottle and microwave?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14859.jpg" +"14860" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14860.jpg" +"14861" "Is there direct contact between the rope and hydrant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14861.jpg" +"14862" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14862.jpg" +"14863" "Is there direct contact between the car and elephant?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14863.jpg" +"14864" "Is there direct contact between the flower and vase?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14864.jpg" +"14865" "Is there direct contact between the apple and sticker?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14865.jpg" +"14866" "Is there direct contact between the hydrant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14866.jpg" +"14867" "Is there direct contact between the hydrant and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14867.jpg" +"14868" "Is there direct contact between the bear and sofa?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14868.jpg" +"14869" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14869.jpg" +"14870" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14870.jpg" +"14871" "Is there direct contact between the elephant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14871.jpg" +"14872" "Is there direct contact between the man and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14872.jpg" +"14873" "Is there direct contact between the man and ship?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14873.jpg" +"14874" "Is there direct contact between the man and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14874.jpg" +"14875" "Is there direct contact between the hat and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14875.jpg" +"14876" "Is there direct contact between the bread and tissue?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14876.jpg" +"14877" "Is there direct contact between the bread and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14877.jpg" +"14878" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14878.jpg" +"14879" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14879.jpg" +"14880" "Is there direct contact between the train and rail?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14880.jpg" +"14881" "Is there direct contact between the train and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14881.jpg" +"14882" "Is there direct contact between the hydrant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14882.jpg" +"14883" "Is there direct contact between the hat and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14883.jpg" +"14884" "Is there direct contact between the pizza and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14884.jpg" +"14885" "Is there direct contact between the person and tie?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14885.jpg" +"14886" "Is there direct contact between the cat and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14886.jpg" +"14887" "Is there direct contact between the child and bat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14887.jpg" +"14888" "Is there direct contact between the bat and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14888.jpg" +"14889" "Is there direct contact between the table and controller?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14889.jpg" +"14890" "Is there direct contact between the grass and sheep?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14890.jpg" +"14891" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14891.jpg" +"14892" "Is there direct contact between the zebra and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14892.jpg" +"14893" "Is there direct contact between the table and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14893.jpg" +"14894" "Is there direct contact between the pen and glass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14894.jpg" +"14895" "Is there direct contact between the surfboard and man?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14895.jpg" +"14896" "Is there direct contact between the man and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14896.jpg" +"14897" "Is there direct contact between the snowboard and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14897.jpg" +"14898" "Is there direct contact between the snowboard and pole?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14898.jpg" +"14899" "Is there direct contact between the train and man?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14899.jpg" +"14900" "Is there direct contact between the train and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14900.jpg" +"14901" "Is there direct contact between the horse and man?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14901.jpg" +"14902" "Is there direct contact between the horse and dog?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14902.jpg" +"14903" "Is there direct contact between the bird and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14903.jpg" +"14904" "Is there direct contact between the bird and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14904.jpg" +"14905" "Is there direct contact between the bird and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14905.jpg" +"14906" "Is there direct contact between the woman and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14906.jpg" +"14907" "Is there direct contact between the dog and cow?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14907.jpg" +"14908" "Is there direct contact between the dog and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14908.jpg" +"14909" "Is there direct contact between the dog and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14909.jpg" +"14910" "Is there direct contact between the pizza and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14910.jpg" +"14911" "Is there direct contact between the pizza and floor?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14911.jpg" +"14912" "Is there direct contact between the man and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14912.jpg" +"14913" "Is there direct contact between the hat and motorbike?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14913.jpg" +"14914" "Is there direct contact between the banana and bowl?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14914.jpg" +"14915" "Is there direct contact between the giraffe and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14915.jpg" +"14916" "Is there direct contact between the giraffe and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14916.jpg" +"14917" "Is there direct contact between the person and motorbike?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14917.jpg" +"14918" "Is there direct contact between the person and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14918.jpg" +"14919" "Is there direct contact between the tangerine and leave?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14919.jpg" +"14920" "Is there direct contact between the mouse and mousepad?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14920.jpg" +"14921" "Is there direct contact between the cup and laptop?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14921.jpg" +"14922" "Is there direct contact between the banana and tinfoil?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14922.jpg" +"14923" "Is there direct contact between the banana and pear?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14923.jpg" +"14924" "Is there direct contact between the sofa and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14924.jpg" +"14925" "Is there direct contact between the laptop and toy?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14925.jpg" +"14926" "Is there direct contact between the ship and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14926.jpg" +"14927" "Is there direct contact between the cat and television?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14927.jpg" +"14928" "Is there direct contact between the cat and air-conditioning?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14928.jpg" +"14929" "Is there direct contact between the cat and umbrella?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14929.jpg" +"14930" "Is there direct contact between the apple and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14930.jpg" +"14931" "Is there direct contact between the apple and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14931.jpg" +"14932" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14932.jpg" +"14933" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14933.jpg" +"14934" "Is there direct contact between the wall and clock?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14934.jpg" +"14935" "Is there direct contact between the clock and ceiling?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14935.jpg" +"14936" "Is there direct contact between the sea and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14936.jpg" +"14937" "Is there direct contact between the umbrella and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14937.jpg" +"14938" "Is there direct contact between the sink and tap?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14938.jpg" +"14939" "Is there direct contact between the mirror and toilet?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14939.jpg" +"14940" "Is there direct contact between the banana and tangerine?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14940.jpg" +"14941" "Is there direct contact between the man and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14941.jpg" +"14942" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14942.jpg" +"14943" "Is there direct contact between the person and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14943.jpg" +"14944" "Is there direct contact between the bench and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14944.jpg" +"14945" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14945.jpg" +"14946" "Is there direct contact between the tennis and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14946.jpg" +"14947" "Is there direct contact between the bird and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14947.jpg" +"14948" "Is there direct contact between the ship and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14948.jpg" +"14949" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14949.jpg" +"14950" "Is there direct contact between the bench and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14950.jpg" +"14951" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14951.jpg" +"14952" "Is there direct contact between the sea and parasail?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14952.jpg" +"14953" "Is there direct contact between the bird and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14953.jpg" +"14954" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14954.jpg" +"14955" "Is there direct contact between the man and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14955.jpg" +"14956" "Is there direct contact between the bear and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14956.jpg" +"14957" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14957.jpg" +"14958" "Is there direct contact between the hydrant and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14958.jpg" +"14959" "Is there direct contact between the cow and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14959.jpg" +"14960" "Is there direct contact between the cow and ship?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14960.jpg" +"14961" "Is there direct contact between the banana and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14961.jpg" +"14962" "Is there direct contact between the banana and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14962.jpg" +"14963" "Is there direct contact between the cat and box?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14963.jpg" +"14964" "Is there direct contact between the box and cushion?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14964.jpg" +"14965" "Is there direct contact between the bench and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14965.jpg" +"14966" "Is there direct contact between the bench and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14966.jpg" +"14967" "Is there direct contact between the dog and bottle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14967.jpg" +"14968" "Is there direct contact between the bottle and tennis?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14968.jpg" +"14969" "Is there direct contact between the bread and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14969.jpg" +"14970" "Is there direct contact between the bread and tablecloth?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14970.jpg" +"14971" "Is there direct contact between the train and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14971.jpg" +"14972" "Is there direct contact between the zebra and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14972.jpg" +"14973" "Is there direct contact between the toothbrush and toy?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14973.jpg" +"14974" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14974.jpg" +"14975" "Is there direct contact between the cow and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14975.jpg" +"14976" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14976.jpg" +"14977" "Is there direct contact between the umbrella and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14977.jpg" +"14978" "Is there direct contact between the cow and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14978.jpg" +"14979" "Is there direct contact between the cow and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14979.jpg" +"14980" "Is there direct contact between the laptop and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14980.jpg" +"14981" "Is there direct contact between the glass and pen?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14981.jpg" +"14982" "Is there direct contact between the man and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14982.jpg" +"14983" "Is there direct contact between the man and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14983.jpg" +"14984" "Is there direct contact between the woman and desert?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14984.jpg" +"14985" "Is there direct contact between the glass and book?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14985.jpg" +"14986" "Is there direct contact between the mountain and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14986.jpg" +"14987" "Is there direct contact between the grass and eagle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14987.jpg" +"14988" "Is there direct contact between the sea and mountain?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14988.jpg" +"14989" "Is there direct contact between the person and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14989.jpg" +"14990" "Is there direct contact between the person and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14990.jpg" +"14991" "Is there direct contact between the man and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14991.jpg" +"14992" "Is there direct contact between the laptop and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14992.jpg" +"14993" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14993.jpg" +"14994" "Is there direct contact between the woman and chair?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14994.jpg" +"14995" "Is there direct contact between the woman and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14995.jpg" +"14996" "Is there direct contact between the mountain and river?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14996.jpg" +"14997" "Is there direct contact between the moon and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14997.jpg" +"14998" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14998.jpg" +"14999" "Is there direct contact between the ship and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/14999.jpg" +"15000" "Is there direct contact between the grass and cow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15000.jpg" +"15001" "Is there direct contact between the cow and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15001.jpg" +"15002" "Is there direct contact between the sheep and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15002.jpg" +"15003" "Is there direct contact between the grape and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15003.jpg" +"15004" "Is there direct contact between the grape and wine?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15004.jpg" +"15005" "Is there direct contact between the child and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15005.jpg" +"15006" "Is there direct contact between the child and pineapple?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15006.jpg" +"15007" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15007.jpg" +"15008" "Is there direct contact between the car and house?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15008.jpg" +"15009" "Is there direct contact between the tortoise and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15009.jpg" +"15010" "Is there direct contact between the tortoise and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15010.jpg" +"15011" "Is there direct contact between the person and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15011.jpg" +"15012" "Is there direct contact between the cup and book?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15012.jpg" +"15013" "Is there direct contact between the house and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15013.jpg" +"15014" "Is there direct contact between the house and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15014.jpg" +"15015" "Is there direct contact between the man and laptop?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15015.jpg" +"15016" "Is there direct contact between the man and curtain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15016.jpg" +"15017" "Is there direct contact between the bowl and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15017.jpg" +"15018" "Is there direct contact between the bowl and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15018.jpg" +"15019" "Is there direct contact between the cola and refrigerator?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15019.jpg" +"15020" "Is there direct contact between the sky and plane?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15020.jpg" +"15021" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15021.jpg" +"15022" "Is there direct contact between the ship and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15022.jpg" +"15023" "Is there direct contact between the sky and sun?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15023.jpg" +"15024" "Is there direct contact between the man and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15024.jpg" +"15025" "Is there direct contact between the lake and tent?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15025.jpg" +"15026" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15026.jpg" +"15027" "Is there direct contact between the person and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15027.jpg" +"15028" "Is there direct contact between the building and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15028.jpg" +"15029" "Is there direct contact between the man and watch?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15029.jpg" +"15030" "Is there direct contact between the watch and chair?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15030.jpg" +"15031" "Is there direct contact between the woman and bicycle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15031.jpg" +"15032" "Is there direct contact between the woman and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15032.jpg" +"15033" "Is there direct contact between the ground and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15033.jpg" +"15034" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15034.jpg" +"15035" "Is there direct contact between the forest and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15035.jpg" +"15036" "Is there direct contact between the cat and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15036.jpg" +"15037" "Is there direct contact between the horse and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15037.jpg" +"15038" "Is there direct contact between the horse and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15038.jpg" +"15039" "Is there direct contact between the lounge and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15039.jpg" +"15040" "Is there direct contact between the umbrella and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15040.jpg" +"15041" "Is there direct contact between the sea and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15041.jpg" +"15042" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15042.jpg" +"15043" "Is there direct contact between the ground and car?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15043.jpg" +"15044" "Is there direct contact between the car and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15044.jpg" +"15045" "Is there direct contact between the pear and leave?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15045.jpg" +"15046" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15046.jpg" +"15047" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15047.jpg" +"15048" "Is there direct contact between the banana and bread?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15048.jpg" +"15049" "Is there direct contact between the man and woman?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15049.jpg" +"15050" "Is there direct contact between the man and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15050.jpg" +"15051" "Is there direct contact between the car and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15051.jpg" +"15052" "Is there direct contact between the woman and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15052.jpg" +"15053" "Is there direct contact between the woman and car?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15053.jpg" +"15054" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15054.jpg" +"15055" "Is there direct contact between the deer and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15055.jpg" +"15056" "Is there direct contact between the deer and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15056.jpg" +"15057" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15057.jpg" +"15058" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15058.jpg" +"15059" "Is there direct contact between the cloud and building?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15059.jpg" +"15060" "Is there direct contact between the person and surfboard?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15060.jpg" +"15061" "Is there direct contact between the flower and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15061.jpg" +"15062" "Is there direct contact between the grass and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15062.jpg" +"15063" "Is there direct contact between the forest and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15063.jpg" +"15064" "Is there direct contact between the person and ship?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15064.jpg" +"15065" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15065.jpg" +"15066" "Is there direct contact between the pen and notebook?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15066.jpg" +"15067" "Is there direct contact between the pen and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15067.jpg" +"15068" "Is there direct contact between the train and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15068.jpg" +"15069" "Is there direct contact between the train and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15069.jpg" +"15070" "Is there direct contact between the cat and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15070.jpg" +"15071" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15071.jpg" +"15072" "Is there direct contact between the dog and desert?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15072.jpg" +"15073" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15073.jpg" +"15074" "Is there direct contact between the shoe and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15074.jpg" +"15075" "Is there direct contact between the woman and camera?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15075.jpg" +"15076" "Is there direct contact between the camera and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15076.jpg" +"15077" "Is there direct contact between the grass and mountain?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15077.jpg" +"15078" "Is there direct contact between the phone and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15078.jpg" +"15079" "Is there direct contact between the phone and cup?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15079.jpg" +"15080" "Is there direct contact between the fox and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15080.jpg" +"15081" "Is there direct contact between the fox and forest?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15081.jpg" +"15082" "Is there direct contact between the goose and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15082.jpg" +"15083" "Is there direct contact between the goose and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15083.jpg" +"15084" "Is there direct contact between the cup and lemon?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15084.jpg" +"15085" "Is there direct contact between the woman and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15085.jpg" +"15086" "Is there direct contact between the tree and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15086.jpg" +"15087" "Is there direct contact between the grass and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15087.jpg" +"15088" "Is there direct contact between the man and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15088.jpg" +"15089" "Is there direct contact between the dog and man?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15089.jpg" +"15090" "Is there direct contact between the table and pad?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15090.jpg" +"15091" "Is there direct contact between the pad and watch?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15091.jpg" +"15092" "Is there direct contact between the car and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15092.jpg" +"15093" "Is there direct contact between the car and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15093.jpg" +"15094" "Is there direct contact between the house and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15094.jpg" +"15095" "Is there direct contact between the man and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15095.jpg" +"15096" "Is there direct contact between the man and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15096.jpg" +"15097" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15097.jpg" +"15098" "Is there direct contact between the ship and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15098.jpg" +"15099" "Is there direct contact between the sky and signal?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15099.jpg" +"15100" "Is there direct contact between the bird and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15100.jpg" +"15101" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15101.jpg" +"15102" "Is there direct contact between the house and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15102.jpg" +"15103" "Is there direct contact between the woman and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15103.jpg" +"15104" "Is there direct contact between the woman and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15104.jpg" +"15105" "Is there direct contact between the grass and flower?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15105.jpg" +"15106" "Is there direct contact between the mushroom and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15106.jpg" +"15107" "Is there direct contact between the pen and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15107.jpg" +"15108" "Is there direct contact between the pen and book?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15108.jpg" +"15109" "Is there direct contact between the bridge and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15109.jpg" +"15110" "Is there direct contact between the chair and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15110.jpg" +"15111" "Is there direct contact between the chair and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15111.jpg" +"15112" "Is there direct contact between the cup and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15112.jpg" +"15113" "Is there direct contact between the cup and table?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15113.jpg" +"15114" "Is there direct contact between the grass and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15114.jpg" +"15115" "Is there direct contact between the tree and cloud?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15115.jpg" +"15116" "Is there direct contact between the person and paddle?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15116.jpg" +"15117" "Is there direct contact between the tree and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15117.jpg" +"15118" "Is there direct contact between the elephant and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15118.jpg" +"15119" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15119.jpg" +"15120" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15120.jpg" +"15121" "Is there direct contact between the dog and sofa?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15121.jpg" +"15122" "Is there direct contact between the dog and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15122.jpg" +"15123" "Is there direct contact between the notebook and pen?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15123.jpg" +"15124" "Is there direct contact between the pen and watch?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15124.jpg" +"15125" "Is there direct contact between the forest and bridge?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15125.jpg" +"15126" "Is there direct contact between the man and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15126.jpg" +"15127" "Is there direct contact between the sea and man?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15127.jpg" +"15128" "Is there direct contact between the forest and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15128.jpg" +"15129" "Is there direct contact between the island and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15129.jpg" +"15130" "Is there direct contact between the person and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15130.jpg" +"15131" "Is there direct contact between the ship and sea?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15131.jpg" +"15132" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15132.jpg" +"15133" "Is there direct contact between the woman and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15133.jpg" +"15134" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15134.jpg" +"15135" "Is there direct contact between the tree and lion?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15135.jpg" +"15136" "Is there direct contact between the person and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15136.jpg" +"15137" "Is there direct contact between the person and sea?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15137.jpg" +"15138" "Is there direct contact between the beach and tortoise?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15138.jpg" +"15139" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15139.jpg" +"15140" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15140.jpg" +"15141" "Is there direct contact between the woman and hat?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15141.jpg" +"15142" "Is there direct contact between the woman and island?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15142.jpg" +"15143" "Is there direct contact between the person and bench?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15143.jpg" +"15144" "Is there direct contact between the person and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15144.jpg" +"15145" "Is there direct contact between the dog and beach?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15145.jpg" +"15146" "Is there direct contact between the dog and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15146.jpg" +"15147" "Is there direct contact between the dog and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15147.jpg" +"15148" "Is there direct contact between the dog and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15148.jpg" +"15149" "Is there direct contact between the dog and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15149.jpg" +"15150" "Is there direct contact between the duck and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15150.jpg" +"15151" "Is there direct contact between the duck and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15151.jpg" +"15152" "Is there direct contact between the goose and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15152.jpg" +"15153" "Is there direct contact between the goose and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15153.jpg" +"15154" "Is there direct contact between the duck and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15154.jpg" +"15155" "Is there direct contact between the fish and lake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15155.jpg" +"15156" "Is there direct contact between the flower and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15156.jpg" +"15157" "Is there direct contact between the flower and vase?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15157.jpg" +"15158" "Is there direct contact between the flower and tablecloth?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15158.jpg" +"15159" "Is there direct contact between the cup and tablecloth?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15159.jpg" +"15160" "Is there direct contact between the cup and grapefruit?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15160.jpg" +"15161" "Is there direct contact between the house and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15161.jpg" +"15162" "Is there direct contact between the lemon and board?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15162.jpg" +"15163" "Is there direct contact between the lemon and grapefruit?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15163.jpg" +"15164" "Is there direct contact between the shrimp and ice?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15164.jpg" +"15165" "Is there direct contact between the shrimp and lemon?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15165.jpg" +"15166" "Is there direct contact between the cup and water?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15166.jpg" +"15167" "Is there direct contact between the lion and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15167.jpg" +"15168" "Is there direct contact between the lion and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15168.jpg" +"15169" "Is there direct contact between the tiger and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15169.jpg" +"15170" "Is there direct contact between the car and tiger?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15170.jpg" +"15171" "Is there direct contact between the lion and stone?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15171.jpg" +"15172" "Is there direct contact between the forest and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15172.jpg" +"15173" "Is there direct contact between the tangerine and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15173.jpg" +"15174" "Is there direct contact between the tangerine and tree?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15174.jpg" +"15175" "Is there direct contact between the tangerine and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15175.jpg" +"15176" "Is there direct contact between the wall and drawing?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15176.jpg" +"15177" "Is there direct contact between the pig and person?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15177.jpg" +"15178" "Is there direct contact between the pig and fence?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15178.jpg" +"15179" "Is there direct contact between the skate and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15179.jpg" +"15180" "Is there direct contact between the watermelon and board?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15180.jpg" +"15181" "Is there direct contact between the lemon and tablecloth?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15181.jpg" +"15182" "Is there direct contact between the plate and table?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15182.jpg" +"15183" "Is there direct contact between the rabbit and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15183.jpg" +"15184" "Is there direct contact between the rabbit and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15184.jpg" +"15185" "Is there direct contact between the cola and refrigerator?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15185.jpg" +"15186" "Is there direct contact between the lake and forest?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15186.jpg" +"15187" "Is there direct contact between the river and mountain?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15187.jpg" +"15188" "Is there direct contact between the sand and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15188.jpg" +"15189" "Is there direct contact between the forest and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15189.jpg" +"15190" "Is there direct contact between the road and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15190.jpg" +"15191" "Is there direct contact between the mountain and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15191.jpg" +"15192" "Is there direct contact between the ground and snow?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15192.jpg" +"15193" "Is there direct contact between the ground and sign?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15193.jpg" +"15194" "Is there direct contact between the sign and grass?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15194.jpg" +"15195" "Is there direct contact between the strawberry and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15195.jpg" +"15196" "Is there direct contact between the strawberry and cake?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15196.jpg" +"15197" "Is there direct contact between the wall and candle?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15197.jpg" +"15198" "Is there direct contact between the car and ground?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15198.jpg" +"15199" "Is there direct contact between the ground and road?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15199.jpg" +"15200" "Is there direct contact between the table and floor?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15200.jpg" +"15201" "Is there direct contact between the tiger and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15201.jpg" +"15202" "Is there direct contact between the tiger and stone?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15202.jpg" +"15203" "Is there direct contact between the tiger and ground?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15203.jpg" +"15204" "Is there direct contact between the tiger and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15204.jpg" +"15205" "Is there direct contact between the tiger and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15205.jpg" +"15206" "Is there direct contact between the tiger and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15206.jpg" +"15207" "Is there direct contact between the tiger and lake?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15207.jpg" +"15208" "Is there direct contact between the tree and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15208.jpg" +"15209" "Is there direct contact between the sky and cloud?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15209.jpg" +"15210" "Is there direct contact between the car and grass?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15210.jpg" +"15211" "Is there direct contact between the car and mountain?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15211.jpg" +"15212" "Is there direct contact between the person and volleyball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15212.jpg" +"15213" "Is there direct contact between the volleyball and beach?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15213.jpg" +"15214" "Is there direct contact between the person and volleyball?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15214.jpg" +"15215" "Is there direct contact between the volleyball and tree?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15215.jpg" +"15216" "Is there direct contact between the watermelon and plate?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15216.jpg" +"15217" "Is there direct contact between the scoon and fork?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15217.jpg" +"15218" "Is there direct contact between the person and watermelon?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15218.jpg" +"15219" "Is there direct contact between the man and cup?" "yes" "discriminative-relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15219.jpg" +"15220" "Is there direct contact between the cup and wall?" "no" "relation" "/simple-eval-dataset-loader-dev/dataset/vlmevalkit/images/AMBER/15220.jpg"