[ { "height": 640, "width": 427, "id": 0, "original_id": 1719310, "dataset_name": "refcoco", "area": 14863.615599999997, "iscrowd": 0, "image_id": 0, "category_id": 1, "bbox_list": [ [ 103.93, 299.99, 237.15, 476.40999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581857.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the lady with the blue shirt.", "normal_caption": "the lady with the blue shirt", "solution": [ 103.93, 299.99, 238.15, 477.41 ], "normalized_solution": [ 243, 468, 557, 745 ] }, { "height": 640, "width": 427, "id": 1, "original_id": 1719310, "dataset_name": "refcoco", "area": 14863.615599999997, "iscrowd": 0, "image_id": 1, "category_id": 1, "bbox_list": [ [ 103.93, 299.99, 237.15, 476.40999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581857.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady with back to us.", "normal_caption": "lady with back to us", "solution": [ 103.93, 299.99, 238.15, 477.41 ], "normalized_solution": [ 243, 468, 557, 745 ] }, { "height": 640, "width": 427, "id": 2, "original_id": 1719310, "dataset_name": "refcoco", "area": 14863.615599999997, "iscrowd": 0, "image_id": 2, "category_id": 1, "bbox_list": [ [ 103.93, 299.99, 237.15, 476.40999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581857.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue shirt.", "normal_caption": "blue shirt", "solution": [ 103.93, 299.99, 238.15, 477.41 ], "normalized_solution": [ 243, 468, 557, 745 ] }, { "height": 640, "width": 427, "id": 3, "original_id": 463958, "dataset_name": "refcoco", "area": 10352.277800000005, "iscrowd": 0, "image_id": 3, "category_id": 1, "bbox_list": [ [ 216.58, 261.7, 297.22, 472.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581857.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in gray shirt facing camera on right.", "normal_caption": "woman in gray shirt facing camera on right", "solution": [ 216.58, 261.7, 298.22, 473.59 ], "normalized_solution": [ 507, 408, 698, 739 ] }, { "height": 640, "width": 427, "id": 4, "original_id": 463958, "dataset_name": "refcoco", "area": 10352.277800000005, "iscrowd": 0, "image_id": 4, "category_id": 1, "bbox_list": [ [ 216.58, 261.7, 297.22, 472.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581857.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman gray right.", "normal_caption": "woman gray right", "solution": [ 216.58, 261.7, 298.22, 473.59 ], "normalized_solution": [ 507, 408, 698, 739 ] }, { "height": 640, "width": 427, "id": 5, "original_id": 463958, "dataset_name": "refcoco", "area": 10352.277800000005, "iscrowd": 0, "image_id": 5, "category_id": 1, "bbox_list": [ [ 216.58, 261.7, 297.22, 472.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581857.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman greyshirt right.", "normal_caption": "woman greyshirt right", "solution": [ 216.58, 261.7, 298.22, 473.59 ], "normalized_solution": [ 507, 408, 698, 739 ] }, { "height": 640, "width": 466, "id": 6, "original_id": 495152, "dataset_name": "refcoco", "area": 12851.723550000002, "iscrowd": 0, "image_id": 6, "category_id": 1, "bbox_list": [ [ 170.75, 91.57, 253.8, 335.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581839.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person standing u.", "normal_caption": "person standing u", "solution": [ 170.75, 91.57, 254.8, 336.98 ], "normalized_solution": [ 366, 143, 546, 526 ] }, { "height": 640, "width": 466, "id": 7, "original_id": 495152, "dataset_name": "refcoco", "area": 12851.723550000002, "iscrowd": 0, "image_id": 7, "category_id": 1, "bbox_list": [ [ 170.75, 91.57, 253.8, 335.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581839.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: standing.", "normal_caption": "standing", "solution": [ 170.75, 91.57, 254.8, 336.98 ], "normalized_solution": [ 366, 143, 546, 526 ] }, { "height": 640, "width": 466, "id": 8, "original_id": 495152, "dataset_name": "refcoco", "area": 12851.723550000002, "iscrowd": 0, "image_id": 8, "category_id": 1, "bbox_list": [ [ 170.75, 91.57, 253.8, 335.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581839.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle standing up.", "normal_caption": "middle standing up", "solution": [ 170.75, 91.57, 254.8, 336.98 ], "normalized_solution": [ 366, 143, 546, 526 ] }, { "height": 640, "width": 466, "id": 9, "original_id": 485695, "dataset_name": "refcoco", "area": 15520.162500000002, "iscrowd": 0, "image_id": 9, "category_id": 1, "bbox_list": [ [ 114.57, 237.84, 319.83, 416.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581839.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady sitting on right.", "normal_caption": "lady sitting on right", "solution": [ 114.57, 237.84, 320.83, 417.49 ], "normalized_solution": [ 245, 371, 688, 652 ] }, { "height": 640, "width": 466, "id": 10, "original_id": 485695, "dataset_name": "refcoco", "area": 15520.162500000002, "iscrowd": 0, "image_id": 10, "category_id": 1, "bbox_list": [ [ 114.57, 237.84, 319.83, 416.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581839.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right girl on floor.", "normal_caption": "right girl on floor", "solution": [ 114.57, 237.84, 320.83, 417.49 ], "normalized_solution": [ 245, 371, 688, 652 ] }, { "height": 640, "width": 466, "id": 11, "original_id": 485695, "dataset_name": "refcoco", "area": 15520.162500000002, "iscrowd": 0, "image_id": 11, "category_id": 1, "bbox_list": [ [ 114.57, 237.84, 319.83, 416.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581839.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman sitting on right.", "normal_caption": "woman sitting on right", "solution": [ 114.57, 237.84, 320.83, 417.49 ], "normalized_solution": [ 245, 371, 688, 652 ] }, { "height": 423, "width": 640, "id": 12, "original_id": 453177, "dataset_name": "refcoco", "area": 32988.456150000005, "iscrowd": 0, "image_id": 12, "category_id": 1, "bbox_list": [ [ 39.33, 95.92, 326.08, 404.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581789.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 39.33, 95.92, 327.08, 405.73 ], "normalized_solution": [ 61, 226, 511, 959 ] }, { "height": 423, "width": 640, "id": 13, "original_id": 453177, "dataset_name": "refcoco", "area": 32988.456150000005, "iscrowd": 0, "image_id": 13, "category_id": 1, "bbox_list": [ [ 39.33, 95.92, 326.08, 404.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581789.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left person.", "normal_caption": "left person", "solution": [ 39.33, 95.92, 327.08, 405.73 ], "normalized_solution": [ 61, 226, 511, 959 ] }, { "height": 423, "width": 640, "id": 14, "original_id": 453177, "dataset_name": "refcoco", "area": 32988.456150000005, "iscrowd": 0, "image_id": 14, "category_id": 1, "bbox_list": [ [ 39.33, 95.92, 326.08, 404.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581789.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman under suitcase.", "normal_caption": "woman under suitcase", "solution": [ 39.33, 95.92, 327.08, 405.73 ], "normalized_solution": [ 61, 226, 511, 959 ] }, { "height": 423, "width": 640, "id": 15, "original_id": 440706, "dataset_name": "refcoco", "area": 88732.272, "iscrowd": 0, "image_id": 15, "category_id": 1, "bbox_list": [ [ 109.26, 60.98, 577.9200000000001, 418.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581789.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in jacket.", "normal_caption": "man in jacket", "solution": [ 109.26, 60.98, 578.92, 419.87 ], "normalized_solution": [ 170, 144, 904, 992 ] }, { "height": 423, "width": 640, "id": 16, "original_id": 440706, "dataset_name": "refcoco", "area": 88732.272, "iscrowd": 0, "image_id": 16, "category_id": 1, "bbox_list": [ [ 109.26, 60.98, 577.9200000000001, 418.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581789.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man trying to help with suitcase.", "normal_caption": "man trying to help with suitcase", "solution": [ 109.26, 60.98, 578.92, 419.87 ], "normalized_solution": [ 170, 144, 904, 992 ] }, { "height": 423, "width": 640, "id": 17, "original_id": 440706, "dataset_name": "refcoco", "area": 88732.272, "iscrowd": 0, "image_id": 17, "category_id": 1, "bbox_list": [ [ 109.26, 60.98, 577.9200000000001, 418.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581789.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 109.26, 60.98, 578.92, 419.87 ], "normalized_solution": [ 170, 144, 904, 992 ] }, { "height": 375, "width": 500, "id": 18, "original_id": 1097431, "dataset_name": "refcoco", "area": 11487.5681, "iscrowd": 0, "image_id": 18, "category_id": 70, "bbox_list": [ [ 19.47, 149.62, 126.82, 283.21000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left most toilet.", "normal_caption": "left most toilet", "solution": [ 19.47, 149.62, 127.82, 284.21 ], "normalized_solution": [ 38, 398, 255, 757 ] }, { "height": 375, "width": 500, "id": 19, "original_id": 1097431, "dataset_name": "refcoco", "area": 11487.5681, "iscrowd": 0, "image_id": 19, "category_id": 70, "bbox_list": [ [ 19.47, 149.62, 126.82, 283.21000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far left toilet.", "normal_caption": "far left toilet", "solution": [ 19.47, 149.62, 127.82, 284.21 ], "normalized_solution": [ 38, 398, 255, 757 ] }, { "height": 375, "width": 500, "id": 20, "original_id": 1097431, "dataset_name": "refcoco", "area": 11487.5681, "iscrowd": 0, "image_id": 20, "category_id": 70, "bbox_list": [ [ 19.47, 149.62, 126.82, 283.21000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left urinal.", "normal_caption": "left urinal", "solution": [ 19.47, 149.62, 127.82, 284.21 ], "normalized_solution": [ 38, 398, 255, 757 ] }, { "height": 375, "width": 500, "id": 21, "original_id": 1093269, "dataset_name": "refcoco", "area": 11540.7888, "iscrowd": 0, "image_id": 21, "category_id": 70, "bbox_list": [ [ 372.47, 75.84, 477.65000000000003, 277.09000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right stall.", "normal_caption": "right stall", "solution": [ 372.47, 75.84, 478.65, 278.09 ], "normalized_solution": [ 744, 202, 957, 741 ] }, { "height": 375, "width": 500, "id": 22, "original_id": 1093269, "dataset_name": "refcoco", "area": 11540.7888, "iscrowd": 0, "image_id": 22, "category_id": 70, "bbox_list": [ [ 372.47, 75.84, 477.65000000000003, 277.09000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right urinal.", "normal_caption": "right urinal", "solution": [ 372.47, 75.84, 478.65, 278.09 ], "normalized_solution": [ 744, 202, 957, 741 ] }, { "height": 375, "width": 500, "id": 23, "original_id": 1093269, "dataset_name": "refcoco", "area": 11540.7888, "iscrowd": 0, "image_id": 23, "category_id": 70, "bbox_list": [ [ 372.47, 75.84, 477.65000000000003, 277.09000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right urinal.", "normal_caption": "right urinal", "solution": [ 372.47, 75.84, 478.65, 278.09 ], "normalized_solution": [ 744, 202, 957, 741 ] }, { "height": 480, "width": 640, "id": 24, "original_id": 1154905, "dataset_name": "refcoco", "area": 12996.479449999992, "iscrowd": 0, "image_id": 24, "category_id": 86, "bbox_list": [ [ 375.0, 148.16, 483.26, 443.84000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right vase.", "normal_caption": "right vase", "solution": [ 375.0, 148.16, 484.26, 444.84 ], "normalized_solution": [ 585, 308, 756, 926 ] }, { "height": 480, "width": 640, "id": 25, "original_id": 1154905, "dataset_name": "refcoco", "area": 12996.479449999992, "iscrowd": 0, "image_id": 25, "category_id": 86, "bbox_list": [ [ 375.0, 148.16, 483.26, 443.84000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right most vase.", "normal_caption": "right most vase", "solution": [ 375.0, 148.16, 484.26, 444.84 ], "normalized_solution": [ 585, 308, 756, 926 ] }, { "height": 480, "width": 640, "id": 26, "original_id": 1152539, "dataset_name": "refcoco", "area": 16159.573249999992, "iscrowd": 0, "image_id": 26, "category_id": 86, "bbox_list": [ [ 265.35, 143.46, 380.84000000000003, 452.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle vase.", "normal_caption": "middle vase", "solution": [ 265.35, 143.46, 381.84, 453.03 ], "normalized_solution": [ 414, 298, 596, 943 ] }, { "height": 480, "width": 640, "id": 27, "original_id": 1152539, "dataset_name": "refcoco", "area": 16159.573249999992, "iscrowd": 0, "image_id": 27, "category_id": 86, "bbox_list": [ [ 265.35, 143.46, 380.84000000000003, 452.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle.", "normal_caption": "middle", "solution": [ 265.35, 143.46, 381.84, 453.03 ], "normalized_solution": [ 414, 298, 596, 943 ] }, { "height": 480, "width": 640, "id": 28, "original_id": 1152539, "dataset_name": "refcoco", "area": 16159.573249999992, "iscrowd": 0, "image_id": 28, "category_id": 86, "bbox_list": [ [ 265.35, 143.46, 380.84000000000003, 452.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: center vase.", "normal_caption": "center vase", "solution": [ 265.35, 143.46, 381.84, 453.03 ], "normalized_solution": [ 414, 298, 596, 943 ] }, { "height": 480, "width": 640, "id": 29, "original_id": 1151495, "dataset_name": "refcoco", "area": 14672.066150000002, "iscrowd": 0, "image_id": 29, "category_id": 86, "bbox_list": [ [ 151.01, 142.23, 264.13, 452.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left vase.", "normal_caption": "left vase", "solution": [ 151.01, 142.23, 265.13, 453.89 ], "normalized_solution": [ 235, 296, 414, 945 ] }, { "height": 480, "width": 640, "id": 30, "original_id": 1151495, "dataset_name": "refcoco", "area": 14672.066150000002, "iscrowd": 0, "image_id": 30, "category_id": 86, "bbox_list": [ [ 151.01, 142.23, 264.13, 452.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581739.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left vase.", "normal_caption": "left vase", "solution": [ 151.01, 142.23, 265.13, 453.89 ], "normalized_solution": [ 235, 296, 414, 945 ] }, { "height": 427, "width": 640, "id": 31, "original_id": 247896, "dataset_name": "refcoco", "area": 17798.32135, "iscrowd": 0, "image_id": 31, "category_id": 6, "bbox_list": [ [ 15.21, 165.15, 188.9, 290.08000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581738.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bus on the left.", "normal_caption": "bus on the left", "solution": [ 15.21, 165.15, 189.9, 291.08 ], "normalized_solution": [ 23, 386, 296, 681 ] }, { "height": 427, "width": 640, "id": 32, "original_id": 247896, "dataset_name": "refcoco", "area": 17798.32135, "iscrowd": 0, "image_id": 32, "category_id": 6, "bbox_list": [ [ 15.21, 165.15, 188.9, 290.08000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581738.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left buss.", "normal_caption": "left buss", "solution": [ 15.21, 165.15, 189.9, 291.08 ], "normalized_solution": [ 23, 386, 296, 681 ] }, { "height": 427, "width": 640, "id": 33, "original_id": 247896, "dataset_name": "refcoco", "area": 17798.32135, "iscrowd": 0, "image_id": 33, "category_id": 6, "bbox_list": [ [ 15.21, 165.15, 188.9, 290.08000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581738.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red bus on the left.", "normal_caption": "red bus on the left", "solution": [ 15.21, 165.15, 189.9, 291.08 ], "normalized_solution": [ 23, 386, 296, 681 ] }, { "height": 427, "width": 640, "id": 34, "original_id": 165092, "dataset_name": "refcoco", "area": 50646.498799999994, "iscrowd": 0, "image_id": 34, "category_id": 6, "bbox_list": [ [ 176.39, 164.58, 571.55, 319.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581738.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bus in front.", "normal_caption": "bus in front", "solution": [ 176.39, 164.58, 572.55, 320.73 ], "normalized_solution": [ 275, 385, 894, 751 ] }, { "height": 427, "width": 640, "id": 35, "original_id": 165092, "dataset_name": "refcoco", "area": 50646.498799999994, "iscrowd": 0, "image_id": 35, "category_id": 6, "bbox_list": [ [ 176.39, 164.58, 571.55, 319.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581738.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right bus.", "normal_caption": "right bus", "solution": [ 176.39, 164.58, 572.55, 320.73 ], "normalized_solution": [ 275, 385, 894, 751 ] }, { "height": 427, "width": 640, "id": 36, "original_id": 165092, "dataset_name": "refcoco", "area": 50646.498799999994, "iscrowd": 0, "image_id": 36, "category_id": 6, "bbox_list": [ [ 176.39, 164.58, 571.55, 319.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581738.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: whole bus.", "normal_caption": "whole bus", "solution": [ 176.39, 164.58, 572.55, 320.73 ], "normalized_solution": [ 275, 385, 894, 751 ] }, { "height": 357, "width": 500, "id": 37, "original_id": 2204728, "dataset_name": "refcoco", "area": 10461.951299999999, "iscrowd": 0, "image_id": 37, "category_id": 1, "bbox_list": [ [ 72.95, 221.86, 211.06, 356.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the head just behind the girl on leftin the middle.", "normal_caption": "the head just behind the girl on leftin the middle", "solution": [ 72.95, 221.86, 212.06, 357.0 ], "normalized_solution": [ 145, 621, 424, 1000 ] }, { "height": 357, "width": 500, "id": 38, "original_id": 2204728, "dataset_name": "refcoco", "area": 10461.951299999999, "iscrowd": 0, "image_id": 38, "category_id": 1, "bbox_list": [ [ 72.95, 221.86, 211.06, 356.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl with no cap on.", "normal_caption": "girl with no cap on", "solution": [ 72.95, 221.86, 212.06, 357.0 ], "normalized_solution": [ 145, 621, 424, 1000 ] }, { "height": 357, "width": 500, "id": 39, "original_id": 2204728, "dataset_name": "refcoco", "area": 10461.951299999999, "iscrowd": 0, "image_id": 39, "category_id": 1, "bbox_list": [ [ 72.95, 221.86, 211.06, 356.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brown hair coming out of girls chin.", "normal_caption": "brown hair coming out of girls chin", "solution": [ 72.95, 221.86, 212.06, 357.0 ], "normalized_solution": [ 145, 621, 424, 1000 ] }, { "height": 357, "width": 500, "id": 40, "original_id": 516523, "dataset_name": "refcoco", "area": 25073.177799999994, "iscrowd": 0, "image_id": 40, "category_id": 1, "bbox_list": [ [ 0.81, 104.56, 160.98, 351.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left kid.", "normal_caption": "left kid", "solution": [ 0.81, 104.56, 161.98, 352.77 ], "normalized_solution": [ 1, 292, 323, 988 ] }, { "height": 357, "width": 500, "id": 41, "original_id": 516523, "dataset_name": "refcoco", "area": 25073.177799999994, "iscrowd": 0, "image_id": 41, "category_id": 1, "bbox_list": [ [ 0.81, 104.56, 160.98, 351.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player left.", "normal_caption": "player left", "solution": [ 0.81, 104.56, 161.98, 352.77 ], "normalized_solution": [ 1, 292, 323, 988 ] }, { "height": 357, "width": 500, "id": 42, "original_id": 516523, "dataset_name": "refcoco", "area": 25073.177799999994, "iscrowd": 0, "image_id": 42, "category_id": 1, "bbox_list": [ [ 0.81, 104.56, 160.98, 351.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left player front.", "normal_caption": "left player front", "solution": [ 0.81, 104.56, 161.98, 352.77 ], "normalized_solution": [ 1, 292, 323, 988 ] }, { "height": 357, "width": 500, "id": 43, "original_id": 511746, "dataset_name": "refcoco", "area": 69806.85174999999, "iscrowd": 0, "image_id": 43, "category_id": 1, "bbox_list": [ [ 141.51, 2.41, 471.78, 351.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy.", "normal_caption": "boy", "solution": [ 141.51, 2.41, 472.78, 352.18 ], "normalized_solution": [ 283, 6, 945, 986 ] }, { "height": 357, "width": 500, "id": 44, "original_id": 511746, "dataset_name": "refcoco", "area": 69806.85174999999, "iscrowd": 0, "image_id": 44, "category_id": 1, "bbox_list": [ [ 141.51, 2.41, 471.78, 351.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid looking at you.", "normal_caption": "kid looking at you", "solution": [ 141.51, 2.41, 472.78, 352.18 ], "normalized_solution": [ 283, 6, 945, 986 ] }, { "height": 357, "width": 500, "id": 45, "original_id": 511746, "dataset_name": "refcoco", "area": 69806.85174999999, "iscrowd": 0, "image_id": 45, "category_id": 1, "bbox_list": [ [ 141.51, 2.41, 471.78, 351.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581719.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy front.", "normal_caption": "boy front", "solution": [ 141.51, 2.41, 472.78, 352.18 ], "normalized_solution": [ 283, 6, 945, 986 ] }, { "height": 425, "width": 640, "id": 46, "original_id": 41223, "dataset_name": "refcoco", "area": 18244.189499999993, "iscrowd": 0, "image_id": 46, "category_id": 16, "bbox_list": [ [ 402.15, 255.0, 602.23, 419.43 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581686.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bird on right.", "normal_caption": "bird on right", "solution": [ 402.15, 255.0, 603.23, 420.43 ], "normalized_solution": [ 628, 600, 942, 989 ] }, { "height": 425, "width": 640, "id": 47, "original_id": 41223, "dataset_name": "refcoco", "area": 18244.189499999993, "iscrowd": 0, "image_id": 47, "category_id": 16, "bbox_list": [ [ 402.15, 255.0, 602.23, 419.43 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581686.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right bird.", "normal_caption": "right bird", "solution": [ 402.15, 255.0, 603.23, 420.43 ], "normalized_solution": [ 628, 600, 942, 989 ] }, { "height": 425, "width": 640, "id": 48, "original_id": 41223, "dataset_name": "refcoco", "area": 18244.189499999993, "iscrowd": 0, "image_id": 48, "category_id": 16, "bbox_list": [ [ 402.15, 255.0, 602.23, 419.43 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581686.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right bird.", "normal_caption": "right bird", "solution": [ 402.15, 255.0, 603.23, 420.43 ], "normalized_solution": [ 628, 600, 942, 989 ] }, { "height": 425, "width": 640, "id": 49, "original_id": 38565, "dataset_name": "refcoco", "area": 14125.245749999998, "iscrowd": 0, "image_id": 49, "category_id": 16, "bbox_list": [ [ 272.37, 263.23, 410.28999999999996, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581686.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left bird.", "normal_caption": "left bird", "solution": [ 272.37, 263.23, 411.29, 425.0 ], "normalized_solution": [ 425, 619, 642, 1000 ] }, { "height": 425, "width": 640, "id": 50, "original_id": 38565, "dataset_name": "refcoco", "area": 14125.245749999998, "iscrowd": 0, "image_id": 50, "category_id": 16, "bbox_list": [ [ 272.37, 263.23, 410.28999999999996, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581686.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left bird.", "normal_caption": "left bird", "solution": [ 272.37, 263.23, 411.29, 425.0 ], "normalized_solution": [ 425, 619, 642, 1000 ] }, { "height": 425, "width": 640, "id": 51, "original_id": 38565, "dataset_name": "refcoco", "area": 14125.245749999998, "iscrowd": 0, "image_id": 51, "category_id": 16, "bbox_list": [ [ 272.37, 263.23, 410.28999999999996, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581686.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bird on left.", "normal_caption": "bird on left", "solution": [ 272.37, 263.23, 411.29, 425.0 ], "normalized_solution": [ 425, 619, 642, 1000 ] }, { "height": 640, "width": 480, "id": 52, "original_id": 1103476, "dataset_name": "refcoco", "area": 19401.545400000006, "iscrowd": 0, "image_id": 52, "category_id": 73, "bbox_list": [ [ 220.04, 207.1, 476.48, 391.63 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second laptop from front right center.", "normal_caption": "second laptop from front right center", "solution": [ 220.04, 207.1, 477.48, 392.63 ], "normalized_solution": [ 458, 323, 994, 613 ] }, { "height": 640, "width": 480, "id": 53, "original_id": 1103476, "dataset_name": "refcoco", "area": 19401.545400000006, "iscrowd": 0, "image_id": 53, "category_id": 73, "bbox_list": [ [ 220.04, 207.1, 476.48, 391.63 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: laptop second from front.", "normal_caption": "laptop second from front", "solution": [ 220.04, 207.1, 477.48, 392.63 ], "normalized_solution": [ 458, 323, 994, 613 ] }, { "height": 640, "width": 480, "id": 54, "original_id": 1103476, "dataset_name": "refcoco", "area": 19401.545400000006, "iscrowd": 0, "image_id": 54, "category_id": 73, "bbox_list": [ [ 220.04, 207.1, 476.48, 391.63 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: laptop above cellphone right.", "normal_caption": "laptop above cellphone right", "solution": [ 220.04, 207.1, 477.48, 392.63 ], "normalized_solution": [ 458, 323, 994, 613 ] }, { "height": 640, "width": 480, "id": 55, "original_id": 1101817, "dataset_name": "refcoco", "area": 106786.83825000004, "iscrowd": 0, "image_id": 55, "category_id": 73, "bbox_list": [ [ 0.0, 151.01, 427.58, 628.9300000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the laptop nearest us.", "normal_caption": "the laptop nearest us", "solution": [ 0.0, 151.01, 428.58, 629.93 ], "normalized_solution": [ 0, 235, 892, 984 ] }, { "height": 640, "width": 480, "id": 56, "original_id": 1101817, "dataset_name": "refcoco", "area": 106786.83825000004, "iscrowd": 0, "image_id": 56, "category_id": 73, "bbox_list": [ [ 0.0, 151.01, 427.58, 628.9300000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: monitor left.", "normal_caption": "monitor left", "solution": [ 0.0, 151.01, 428.58, 629.93 ], "normalized_solution": [ 0, 235, 892, 984 ] }, { "height": 640, "width": 480, "id": 57, "original_id": 556799, "dataset_name": "refcoco", "area": 24497.341400000005, "iscrowd": 0, "image_id": 57, "category_id": 1, "bbox_list": [ [ 260.41, 378.05, 479.0, 605.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand in the front bottom right.", "normal_caption": "hand in the front bottom right", "solution": [ 260.41, 378.05, 480.0, 606.8 ], "normalized_solution": [ 542, 590, 1000, 948 ] }, { "height": 640, "width": 480, "id": 58, "original_id": 556799, "dataset_name": "refcoco", "area": 24497.341400000005, "iscrowd": 0, "image_id": 58, "category_id": 1, "bbox_list": [ [ 260.41, 378.05, 479.0, 605.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: fronnt hand.", "normal_caption": "fronnt hand", "solution": [ 260.41, 378.05, 480.0, 606.8 ], "normalized_solution": [ 542, 590, 1000, 948 ] }, { "height": 640, "width": 480, "id": 59, "original_id": 1758997, "dataset_name": "refcoco", "area": 16302.913300000004, "iscrowd": 0, "image_id": 59, "category_id": 1, "bbox_list": [ [ 379.69, 2.35, 479.0, 240.26999999999998 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: upper right corner.", "normal_caption": "upper right corner", "solution": [ 379.69, 2.35, 480.0, 241.27 ], "normalized_solution": [ 791, 3, 1000, 376 ] }, { "height": 640, "width": 480, "id": 60, "original_id": 1758997, "dataset_name": "refcoco", "area": 16302.913300000004, "iscrowd": 0, "image_id": 60, "category_id": 1, "bbox_list": [ [ 379.69, 2.35, 479.0, 240.26999999999998 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top right of image.", "normal_caption": "top right of image", "solution": [ 379.69, 2.35, 480.0, 241.27 ], "normalized_solution": [ 791, 3, 1000, 376 ] }, { "height": 640, "width": 480, "id": 61, "original_id": 1758997, "dataset_name": "refcoco", "area": 16302.913300000004, "iscrowd": 0, "image_id": 61, "category_id": 1, "bbox_list": [ [ 379.69, 2.35, 479.0, 240.26999999999998 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: upper right corner.", "normal_caption": "upper right corner", "solution": [ 379.69, 2.35, 480.0, 241.27 ], "normalized_solution": [ 791, 3, 1000, 376 ] }, { "height": 332, "width": 500, "id": 62, "original_id": 2157900, "dataset_name": "refcoco", "area": 13833.504999999997, "iscrowd": 0, "image_id": 62, "category_id": 1, "bbox_list": [ [ 0.0, 130.12, 147.71, 297.71000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on left white hat.", "normal_caption": "man on left white hat", "solution": [ 0.0, 130.12, 148.71, 298.71 ], "normalized_solution": [ 0, 391, 297, 899 ] }, { "height": 332, "width": 500, "id": 63, "original_id": 2157900, "dataset_name": "refcoco", "area": 13833.504999999997, "iscrowd": 0, "image_id": 63, "category_id": 1, "bbox_list": [ [ 0.0, 130.12, 147.71, 297.71000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left dude.", "normal_caption": "left dude", "solution": [ 0.0, 130.12, 148.71, 298.71 ], "normalized_solution": [ 0, 391, 297, 899 ] }, { "height": 332, "width": 500, "id": 64, "original_id": 2157900, "dataset_name": "refcoco", "area": 13833.504999999997, "iscrowd": 0, "image_id": 64, "category_id": 1, "bbox_list": [ [ 0.0, 130.12, 147.71, 297.71000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hat.", "normal_caption": "hat", "solution": [ 0.0, 130.12, 148.71, 298.71 ], "normalized_solution": [ 0, 391, 297, 899 ] }, { "height": 332, "width": 500, "id": 65, "original_id": 508442, "dataset_name": "refcoco", "area": 20918.16165, "iscrowd": 0, "image_id": 65, "category_id": 1, "bbox_list": [ [ 347.67, 124.47, 497.37, 327.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on right.", "normal_caption": "guy on right", "solution": [ 347.67, 124.47, 498.37, 328.89 ], "normalized_solution": [ 695, 374, 996, 990 ] }, { "height": 332, "width": 500, "id": 66, "original_id": 508442, "dataset_name": "refcoco", "area": 20918.16165, "iscrowd": 0, "image_id": 66, "category_id": 1, "bbox_list": [ [ 347.67, 124.47, 497.37, 327.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bald man.", "normal_caption": "bald man", "solution": [ 347.67, 124.47, 498.37, 328.89 ], "normalized_solution": [ 695, 374, 996, 990 ] }, { "height": 332, "width": 500, "id": 67, "original_id": 508442, "dataset_name": "refcoco", "area": 20918.16165, "iscrowd": 0, "image_id": 67, "category_id": 1, "bbox_list": [ [ 347.67, 124.47, 497.37, 327.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bald guy.", "normal_caption": "bald guy", "solution": [ 347.67, 124.47, 498.37, 328.89 ], "normalized_solution": [ 695, 374, 996, 990 ] }, { "height": 332, "width": 500, "id": 68, "original_id": 500335, "dataset_name": "refcoco", "area": 32940.15345000001, "iscrowd": 0, "image_id": 68, "category_id": 1, "bbox_list": [ [ 133.4, 97.99, 354.98, 327.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: center girl.", "normal_caption": "center girl", "solution": [ 133.4, 97.99, 355.98, 328.07 ], "normalized_solution": [ 266, 295, 711, 988 ] }, { "height": 332, "width": 500, "id": 69, "original_id": 500335, "dataset_name": "refcoco", "area": 32940.15345000001, "iscrowd": 0, "image_id": 69, "category_id": 1, "bbox_list": [ [ 133.4, 97.99, 354.98, 327.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 133.4, 97.99, 355.98, 328.07 ], "normalized_solution": [ 266, 295, 711, 988 ] }, { "height": 332, "width": 500, "id": 70, "original_id": 500335, "dataset_name": "refcoco", "area": 32940.15345000001, "iscrowd": 0, "image_id": 70, "category_id": 1, "bbox_list": [ [ 133.4, 97.99, 354.98, 327.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581629.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 133.4, 97.99, 355.98, 328.07 ], "normalized_solution": [ 266, 295, 711, 988 ] }, { "height": 514, "width": 640, "id": 71, "original_id": 2218461, "dataset_name": "refcoco", "area": 91175.75775, "iscrowd": 0, "image_id": 71, "category_id": 54, "bbox_list": [ [ 377.27, 25.47, 609.22, 508.08000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581481.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right half.", "normal_caption": "right half", "solution": [ 377.27, 25.47, 610.22, 509.08 ], "normalized_solution": [ 589, 49, 953, 990 ] }, { "height": 514, "width": 640, "id": 72, "original_id": 2218461, "dataset_name": "refcoco", "area": 91175.75775, "iscrowd": 0, "image_id": 72, "category_id": 54, "bbox_list": [ [ 377.27, 25.47, 609.22, 508.08000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581481.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: what are these foods thing on the right.", "normal_caption": "what are these foods thing on the right", "solution": [ 377.27, 25.47, 610.22, 509.08 ], "normalized_solution": [ 589, 49, 953, 990 ] }, { "height": 514, "width": 640, "id": 73, "original_id": 2218461, "dataset_name": "refcoco", "area": 91175.75775, "iscrowd": 0, "image_id": 73, "category_id": 54, "bbox_list": [ [ 377.27, 25.47, 609.22, 508.08000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581481.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chicken.", "normal_caption": "chicken", "solution": [ 377.27, 25.47, 610.22, 509.08 ], "normalized_solution": [ 589, 49, 953, 990 ] }, { "height": 514, "width": 640, "id": 74, "original_id": 309123, "dataset_name": "refcoco", "area": 109294.50130000003, "iscrowd": 0, "image_id": 74, "category_id": 54, "bbox_list": [ [ 153.28, 0.0, 415.03999999999996, 507.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581481.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: food left with onions.", "normal_caption": "food left with onions", "solution": [ 153.28, 0.0, 416.04, 508.01 ], "normalized_solution": [ 239, 0, 650, 988 ] }, { "height": 514, "width": 640, "id": 75, "original_id": 309123, "dataset_name": "refcoco", "area": 109294.50130000003, "iscrowd": 0, "image_id": 75, "category_id": 54, "bbox_list": [ [ 153.28, 0.0, 415.03999999999996, 507.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581481.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the carrots.", "normal_caption": "the carrots", "solution": [ 153.28, 0.0, 416.04, 508.01 ], "normalized_solution": [ 239, 0, 650, 988 ] }, { "height": 514, "width": 640, "id": 76, "original_id": 309123, "dataset_name": "refcoco", "area": 109294.50130000003, "iscrowd": 0, "image_id": 76, "category_id": 54, "bbox_list": [ [ 153.28, 0.0, 415.03999999999996, 507.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581481.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: side with onion.", "normal_caption": "side with onion", "solution": [ 153.28, 0.0, 416.04, 508.01 ], "normalized_solution": [ 239, 0, 650, 988 ] }, { "height": 478, "width": 640, "id": 77, "original_id": 75700, "dataset_name": "refcoco", "area": 16145.659049999995, "iscrowd": 0, "image_id": 77, "category_id": 21, "bbox_list": [ [ 2.06, 166.53, 94.60000000000001, 431.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow on left front.", "normal_caption": "cow on left front", "solution": [ 2.06, 166.53, 95.6, 432.77 ], "normalized_solution": [ 3, 348, 149, 905 ] }, { "height": 478, "width": 640, "id": 78, "original_id": 75700, "dataset_name": "refcoco", "area": 16145.659049999995, "iscrowd": 0, "image_id": 78, "category_id": 21, "bbox_list": [ [ 2.06, 166.53, 94.60000000000001, 431.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left cow.", "normal_caption": "left cow", "solution": [ 2.06, 166.53, 95.6, 432.77 ], "normalized_solution": [ 3, 348, 149, 905 ] }, { "height": 478, "width": 640, "id": 79, "original_id": 75700, "dataset_name": "refcoco", "area": 16145.659049999995, "iscrowd": 0, "image_id": 79, "category_id": 21, "bbox_list": [ [ 2.06, 166.53, 94.60000000000001, 431.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: leftmost animal edge of pic.", "normal_caption": "leftmost animal edge of pic", "solution": [ 2.06, 166.53, 95.6, 432.77 ], "normalized_solution": [ 3, 348, 149, 905 ] }, { "height": 478, "width": 640, "id": 80, "original_id": 71392, "dataset_name": "refcoco", "area": 38059.44980000001, "iscrowd": 0, "image_id": 80, "category_id": 21, "bbox_list": [ [ 364.92, 161.39, 632.22, 406.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow lying down on right.", "normal_caption": "cow lying down on right", "solution": [ 364.92, 161.39, 633.22, 407.07 ], "normalized_solution": [ 570, 337, 989, 851 ] }, { "height": 478, "width": 640, "id": 81, "original_id": 71392, "dataset_name": "refcoco", "area": 38059.44980000001, "iscrowd": 0, "image_id": 81, "category_id": 21, "bbox_list": [ [ 364.92, 161.39, 632.22, 406.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brown white cow laying down.", "normal_caption": "brown white cow laying down", "solution": [ 364.92, 161.39, 633.22, 407.07 ], "normalized_solution": [ 570, 337, 989, 851 ] }, { "height": 478, "width": 640, "id": 82, "original_id": 71392, "dataset_name": "refcoco", "area": 38059.44980000001, "iscrowd": 0, "image_id": 82, "category_id": 21, "bbox_list": [ [ 364.92, 161.39, 632.22, 406.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow sitting.", "normal_caption": "cow sitting", "solution": [ 364.92, 161.39, 633.22, 407.07 ], "normalized_solution": [ 570, 337, 989, 851 ] }, { "height": 478, "width": 640, "id": 83, "original_id": 70901, "dataset_name": "refcoco", "area": 21952.455300000005, "iscrowd": 0, "image_id": 83, "category_id": 21, "bbox_list": [ [ 174.7, 125.35, 317.16999999999996, 376.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: tail of cow in middle.", "normal_caption": "tail of cow in middle", "solution": [ 174.7, 125.35, 318.17, 377.77 ], "normalized_solution": [ 272, 262, 497, 790 ] }, { "height": 478, "width": 640, "id": 84, "original_id": 70901, "dataset_name": "refcoco", "area": 21952.455300000005, "iscrowd": 0, "image_id": 84, "category_id": 21, "bbox_list": [ [ 174.7, 125.35, 317.16999999999996, 376.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle cow butt.", "normal_caption": "middle cow butt", "solution": [ 174.7, 125.35, 318.17, 377.77 ], "normalized_solution": [ 272, 262, 497, 790 ] }, { "height": 478, "width": 640, "id": 85, "original_id": 70901, "dataset_name": "refcoco", "area": 21952.455300000005, "iscrowd": 0, "image_id": 85, "category_id": 21, "bbox_list": [ [ 174.7, 125.35, 317.16999999999996, 376.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581466.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow butt.", "normal_caption": "cow butt", "solution": [ 174.7, 125.35, 318.17, 377.77 ], "normalized_solution": [ 272, 262, 497, 790 ] }, { "height": 427, "width": 640, "id": 86, "original_id": 510191, "dataset_name": "refcoco", "area": 19203.686749999997, "iscrowd": 0, "image_id": 86, "category_id": 1, "bbox_list": [ [ 172.44, 150.55, 341.14, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in white.", "normal_caption": "woman in white", "solution": [ 172.44, 150.55, 342.14, 427.0 ], "normalized_solution": [ 269, 352, 534, 1000 ] }, { "height": 427, "width": 640, "id": 87, "original_id": 510191, "dataset_name": "refcoco", "area": 19203.686749999997, "iscrowd": 0, "image_id": 87, "category_id": 1, "bbox_list": [ [ 172.44, 150.55, 341.14, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: female in white shorts and hat.", "normal_caption": "female in white shorts and hat", "solution": [ 172.44, 150.55, 342.14, 427.0 ], "normalized_solution": [ 269, 352, 534, 1000 ] }, { "height": 427, "width": 640, "id": 88, "original_id": 510191, "dataset_name": "refcoco", "area": 19203.686749999997, "iscrowd": 0, "image_id": 88, "category_id": 1, "bbox_list": [ [ 172.44, 150.55, 341.14, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue shirt.", "normal_caption": "blue shirt", "solution": [ 172.44, 150.55, 342.14, 427.0 ], "normalized_solution": [ 269, 352, 534, 1000 ] }, { "height": 427, "width": 640, "id": 89, "original_id": 505664, "dataset_name": "refcoco", "area": 14772.5408, "iscrowd": 0, "image_id": 89, "category_id": 1, "bbox_list": [ [ 312.81, 168.88, 498.93, 420.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady in black on right.", "normal_caption": "lady in black on right", "solution": [ 312.81, 168.88, 499.93, 421.24 ], "normalized_solution": [ 488, 395, 781, 986 ] }, { "height": 427, "width": 640, "id": 90, "original_id": 505664, "dataset_name": "refcoco", "area": 14772.5408, "iscrowd": 0, "image_id": 90, "category_id": 1, "bbox_list": [ [ 312.81, 168.88, 498.93, 420.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in black.", "normal_caption": "girl in black", "solution": [ 312.81, 168.88, 499.93, 421.24 ], "normalized_solution": [ 488, 395, 781, 986 ] }, { "height": 427, "width": 640, "id": 91, "original_id": 505664, "dataset_name": "refcoco", "area": 14772.5408, "iscrowd": 0, "image_id": 91, "category_id": 1, "bbox_list": [ [ 312.81, 168.88, 498.93, 420.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in black.", "normal_caption": "woman in black", "solution": [ 312.81, 168.88, 499.93, 421.24 ], "normalized_solution": [ 488, 395, 781, 986 ] }, { "height": 640, "width": 480, "id": 92, "original_id": 2005581, "dataset_name": "refcoco", "area": 29261.368049999997, "iscrowd": 0, "image_id": 92, "category_id": 1, "bbox_list": [ [ 74.27, 70.18, 277.27, 295.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man cut face.", "normal_caption": "man cut face", "solution": [ 74.27, 70.18, 278.27, 296.11 ], "normalized_solution": [ 154, 109, 579, 462 ] }, { "height": 640, "width": 480, "id": 93, "original_id": 2005581, "dataset_name": "refcoco", "area": 29261.368049999997, "iscrowd": 0, "image_id": 93, "category_id": 1, "bbox_list": [ [ 74.27, 70.18, 277.27, 295.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: face cut out.", "normal_caption": "face cut out", "solution": [ 74.27, 70.18, 278.27, 296.11 ], "normalized_solution": [ 154, 109, 579, 462 ] }, { "height": 640, "width": 480, "id": 94, "original_id": 531973, "dataset_name": "refcoco", "area": 15359.557099999998, "iscrowd": 0, "image_id": 94, "category_id": 1, "bbox_list": [ [ 97.23, 307.22, 279.58, 468.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pirate picture on cake.", "normal_caption": "pirate picture on cake", "solution": [ 97.23, 307.22, 280.58, 469.13 ], "normalized_solution": [ 202, 480, 584, 733 ] }, { "height": 640, "width": 480, "id": 95, "original_id": 531973, "dataset_name": "refcoco", "area": 15359.557099999998, "iscrowd": 0, "image_id": 95, "category_id": 1, "bbox_list": [ [ 97.23, 307.22, 279.58, 468.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: picture on the cake.", "normal_caption": "picture on the cake", "solution": [ 97.23, 307.22, 280.58, 469.13 ], "normalized_solution": [ 202, 480, 584, 733 ] }, { "height": 640, "width": 480, "id": 96, "original_id": 531973, "dataset_name": "refcoco", "area": 15359.557099999998, "iscrowd": 0, "image_id": 96, "category_id": 1, "bbox_list": [ [ 97.23, 307.22, 279.58, 468.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid in pirate hat.", "normal_caption": "kid in pirate hat", "solution": [ 97.23, 307.22, 280.58, 469.13 ], "normalized_solution": [ 202, 480, 584, 733 ] }, { "height": 640, "width": 480, "id": 97, "original_id": 490700, "dataset_name": "refcoco", "area": 28520.92355, "iscrowd": 0, "image_id": 97, "category_id": 1, "bbox_list": [ [ 331.7, 0.0, 479.0, 262.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: fist.", "normal_caption": "fist", "solution": [ 331.7, 0.0, 480.0, 263.27 ], "normalized_solution": [ 691, 0, 1000, 411 ] }, { "height": 640, "width": 480, "id": 98, "original_id": 490700, "dataset_name": "refcoco", "area": 28520.92355, "iscrowd": 0, "image_id": 98, "category_id": 1, "bbox_list": [ [ 331.7, 0.0, 479.0, 262.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: fist.", "normal_caption": "fist", "solution": [ 331.7, 0.0, 480.0, 263.27 ], "normalized_solution": [ 691, 0, 1000, 411 ] }, { "height": 640, "width": 480, "id": 99, "original_id": 490700, "dataset_name": "refcoco", "area": 28520.92355, "iscrowd": 0, "image_id": 99, "category_id": 1, "bbox_list": [ [ 331.7, 0.0, 479.0, 262.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581425.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand in top right corner.", "normal_caption": "hand in top right corner", "solution": [ 331.7, 0.0, 480.0, 263.27 ], "normalized_solution": [ 691, 0, 1000, 411 ] }, { "height": 612, "width": 612, "id": 100, "original_id": 1991154, "dataset_name": "refcoco", "area": 34255.85784999999, "iscrowd": 0, "image_id": 100, "category_id": 85, "bbox_list": [ [ 388.29, 244.08, 599.8100000000001, 450.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: scale bottom right.", "normal_caption": "scale bottom right", "solution": [ 388.29, 244.08, 600.81, 451.81 ], "normalized_solution": [ 634, 398, 981, 738 ] }, { "height": 612, "width": 612, "id": 101, "original_id": 1991154, "dataset_name": "refcoco", "area": 34255.85784999999, "iscrowd": 0, "image_id": 101, "category_id": 85, "bbox_list": [ [ 388.29, 244.08, 599.8100000000001, 450.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom right clock.", "normal_caption": "bottom right clock", "solution": [ 388.29, 244.08, 600.81, 451.81 ], "normalized_solution": [ 634, 398, 981, 738 ] }, { "height": 612, "width": 612, "id": 102, "original_id": 1991154, "dataset_name": "refcoco", "area": 34255.85784999999, "iscrowd": 0, "image_id": 102, "category_id": 85, "bbox_list": [ [ 388.29, 244.08, 599.8100000000001, 450.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: clock on bottom right.", "normal_caption": "clock on bottom right", "solution": [ 388.29, 244.08, 600.81, 451.81 ], "normalized_solution": [ 634, 398, 981, 738 ] }, { "height": 612, "width": 612, "id": 103, "original_id": 1991009, "dataset_name": "refcoco", "area": 39669.524750000004, "iscrowd": 0, "image_id": 103, "category_id": 85, "bbox_list": [ [ 135.12, 235.26, 351.89, 455.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left clock.", "normal_caption": "bottom left clock", "solution": [ 135.12, 235.26, 352.89, 456.22 ], "normalized_solution": [ 220, 384, 576, 745 ] }, { "height": 612, "width": 612, "id": 104, "original_id": 1991009, "dataset_name": "refcoco", "area": 39669.524750000004, "iscrowd": 0, "image_id": 104, "category_id": 85, "bbox_list": [ [ 135.12, 235.26, 351.89, 455.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: clock next to womans left foot.", "normal_caption": "clock next to womans left foot", "solution": [ 135.12, 235.26, 352.89, 456.22 ], "normalized_solution": [ 220, 384, 576, 745 ] }, { "height": 612, "width": 612, "id": 105, "original_id": 1991009, "dataset_name": "refcoco", "area": 39669.524750000004, "iscrowd": 0, "image_id": 105, "category_id": 85, "bbox_list": [ [ 135.12, 235.26, 351.89, 455.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left clock.", "normal_caption": "bottom left clock", "solution": [ 135.12, 235.26, 352.89, 456.22 ], "normalized_solution": [ 220, 384, 576, 745 ] }, { "height": 612, "width": 612, "id": 106, "original_id": 337651, "dataset_name": "refcoco", "area": 37597.7934, "iscrowd": 0, "image_id": 106, "category_id": 85, "bbox_list": [ [ 15.09, 30.19, 226.78, 239.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top on left clock.", "normal_caption": "top on left clock", "solution": [ 15.09, 30.19, 227.78, 240.13 ], "normalized_solution": [ 24, 49, 372, 392 ] }, { "height": 612, "width": 612, "id": 107, "original_id": 337651, "dataset_name": "refcoco", "area": 37597.7934, "iscrowd": 0, "image_id": 107, "category_id": 85, "bbox_list": [ [ 15.09, 30.19, 226.78, 239.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left clock.", "normal_caption": "top left clock", "solution": [ 15.09, 30.19, 227.78, 240.13 ], "normalized_solution": [ 24, 49, 372, 392 ] }, { "height": 612, "width": 612, "id": 108, "original_id": 337651, "dataset_name": "refcoco", "area": 37597.7934, "iscrowd": 0, "image_id": 108, "category_id": 85, "bbox_list": [ [ 15.09, 30.19, 226.78, 239.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left corner clock.", "normal_caption": "top left corner clock", "solution": [ 15.09, 30.19, 227.78, 240.13 ], "normalized_solution": [ 24, 49, 372, 392 ] }, { "height": 612, "width": 612, "id": 109, "original_id": 336962, "dataset_name": "refcoco", "area": 35743.24835, "iscrowd": 0, "image_id": 109, "category_id": 85, "bbox_list": [ [ 248.3, 16.02, 456.27, 222.46 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top right clock.", "normal_caption": "top right clock", "solution": [ 248.3, 16.02, 457.27, 223.46 ], "normalized_solution": [ 405, 26, 747, 365 ] }, { "height": 612, "width": 612, "id": 110, "original_id": 336962, "dataset_name": "refcoco", "area": 35743.24835, "iscrowd": 0, "image_id": 110, "category_id": 85, "bbox_list": [ [ 248.3, 16.02, 456.27, 222.46 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: one on the top right.", "normal_caption": "one on the top right", "solution": [ 248.3, 16.02, 457.27, 223.46 ], "normalized_solution": [ 405, 26, 747, 365 ] }, { "height": 612, "width": 612, "id": 111, "original_id": 336962, "dataset_name": "refcoco", "area": 35743.24835, "iscrowd": 0, "image_id": 111, "category_id": 85, "bbox_list": [ [ 248.3, 16.02, 456.27, 222.46 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581419.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: upper right clock.", "normal_caption": "upper right clock", "solution": [ 248.3, 16.02, 457.27, 223.46 ], "normalized_solution": [ 405, 26, 747, 365 ] }, { "height": 424, "width": 640, "id": 112, "original_id": 57804, "dataset_name": "refcoco", "area": 44479.57560000001, "iscrowd": 0, "image_id": 112, "category_id": 19, "bbox_list": [ [ 79.33, 228.36, 638.69, 423.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581354.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse in front close up.", "normal_caption": "horse in front close up", "solution": [ 79.33, 228.36, 639.69, 424.0 ], "normalized_solution": [ 123, 538, 999, 1000 ] }, { "height": 424, "width": 640, "id": 113, "original_id": 57804, "dataset_name": "refcoco", "area": 44479.57560000001, "iscrowd": 0, "image_id": 113, "category_id": 19, "bbox_list": [ [ 79.33, 228.36, 638.69, 423.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581354.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white hair front horse.", "normal_caption": "white hair front horse", "solution": [ 79.33, 228.36, 639.69, 424.0 ], "normalized_solution": [ 123, 538, 999, 1000 ] }, { "height": 424, "width": 640, "id": 114, "original_id": 57804, "dataset_name": "refcoco", "area": 44479.57560000001, "iscrowd": 0, "image_id": 114, "category_id": 19, "bbox_list": [ [ 79.33, 228.36, 638.69, 423.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581354.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse up front.", "normal_caption": "horse up front", "solution": [ 79.33, 228.36, 639.69, 424.0 ], "normalized_solution": [ 123, 538, 999, 1000 ] }, { "height": 424, "width": 640, "id": 115, "original_id": 55711, "dataset_name": "refcoco", "area": 21146.30755000001, "iscrowd": 0, "image_id": 115, "category_id": 19, "bbox_list": [ [ 222.92, 157.95, 510.35, 348.94 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581354.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far horse head.", "normal_caption": "far horse head", "solution": [ 222.92, 157.95, 511.35, 349.94 ], "normalized_solution": [ 348, 372, 798, 825 ] }, { "height": 424, "width": 640, "id": 116, "original_id": 55711, "dataset_name": "refcoco", "area": 21146.30755000001, "iscrowd": 0, "image_id": 116, "category_id": 19, "bbox_list": [ [ 222.92, 157.95, 510.35, 348.94 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581354.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse with pink girl riding on it.", "normal_caption": "horse with pink girl riding on it", "solution": [ 222.92, 157.95, 511.35, 349.94 ], "normalized_solution": [ 348, 372, 798, 825 ] }, { "height": 424, "width": 640, "id": 117, "original_id": 55711, "dataset_name": "refcoco", "area": 21146.30755000001, "iscrowd": 0, "image_id": 117, "category_id": 19, "bbox_list": [ [ 222.92, 157.95, 510.35, 348.94 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581354.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: back horse.", "normal_caption": "back horse", "solution": [ 222.92, 157.95, 511.35, 349.94 ], "normalized_solution": [ 348, 372, 798, 825 ] }, { "height": 640, "width": 427, "id": 118, "original_id": 459894, "dataset_name": "refcoco", "area": 94266.15455, "iscrowd": 0, "image_id": 118, "category_id": 1, "bbox_list": [ [ 4.3, 163.75, 330.48, 630.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581258.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: main person in photo in tie.", "normal_caption": "main person in photo in tie", "solution": [ 4.3, 163.75, 331.48, 631.56 ], "normalized_solution": [ 10, 255, 776, 986 ] }, { "height": 640, "width": 427, "id": 119, "original_id": 459894, "dataset_name": "refcoco", "area": 94266.15455, "iscrowd": 0, "image_id": 119, "category_id": 1, "bbox_list": [ [ 4.3, 163.75, 330.48, 630.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581258.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the man with an umbrella.", "normal_caption": "the man with an umbrella", "solution": [ 4.3, 163.75, 331.48, 631.56 ], "normalized_solution": [ 10, 255, 776, 986 ] }, { "height": 640, "width": 480, "id": 120, "original_id": 1816401, "dataset_name": "refcoco", "area": 22233.763750000002, "iscrowd": 0, "image_id": 120, "category_id": 17, "bbox_list": [ [ 227.5, 68.44, 479.0, 215.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581249.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cat on suit.", "normal_caption": "cat on suit", "solution": [ 227.5, 68.44, 480.0, 216.24 ], "normalized_solution": [ 473, 106, 1000, 337 ] }, { "height": 640, "width": 480, "id": 121, "original_id": 1816401, "dataset_name": "refcoco", "area": 22233.763750000002, "iscrowd": 0, "image_id": 121, "category_id": 17, "bbox_list": [ [ 227.5, 68.44, 479.0, 215.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581249.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black and white kitty.", "normal_caption": "black and white kitty", "solution": [ 227.5, 68.44, 480.0, 216.24 ], "normalized_solution": [ 473, 106, 1000, 337 ] }, { "height": 640, "width": 480, "id": 122, "original_id": 48922, "dataset_name": "refcoco", "area": 29519.741799999993, "iscrowd": 0, "image_id": 122, "category_id": 17, "bbox_list": [ [ 19.29, 318.34, 201.29, 618.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581249.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cat bottomleft.", "normal_caption": "cat bottomleft", "solution": [ 19.29, 318.34, 202.29, 619.65 ], "normalized_solution": [ 40, 497, 421, 968 ] }, { "height": 640, "width": 480, "id": 123, "original_id": 48922, "dataset_name": "refcoco", "area": 29519.741799999993, "iscrowd": 0, "image_id": 123, "category_id": 17, "bbox_list": [ [ 19.29, 318.34, 201.29, 618.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581249.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left cat.", "normal_caption": "left cat", "solution": [ 19.29, 318.34, 202.29, 619.65 ], "normalized_solution": [ 40, 497, 421, 968 ] }, { "height": 640, "width": 480, "id": 124, "original_id": 48922, "dataset_name": "refcoco", "area": 29519.741799999993, "iscrowd": 0, "image_id": 124, "category_id": 17, "bbox_list": [ [ 19.29, 318.34, 201.29, 618.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581249.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cat on floor.", "normal_caption": "cat on floor", "solution": [ 19.29, 318.34, 202.29, 619.65 ], "normalized_solution": [ 40, 497, 421, 968 ] }, { "height": 333, "width": 500, "id": 125, "original_id": 538268, "dataset_name": "refcoco", "area": 11555.38805, "iscrowd": 0, "image_id": 125, "category_id": 1, "bbox_list": [ [ 42.46, 120.08, 124.9, 332.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581227.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far left player.", "normal_caption": "far left player", "solution": [ 42.46, 120.08, 125.9, 333.0 ], "normalized_solution": [ 84, 360, 251, 1000 ] }, { "height": 333, "width": 500, "id": 126, "original_id": 538268, "dataset_name": "refcoco", "area": 11555.38805, "iscrowd": 0, "image_id": 126, "category_id": 1, "bbox_list": [ [ 42.46, 120.08, 124.9, 332.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581227.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left player.", "normal_caption": "left player", "solution": [ 42.46, 120.08, 125.9, 333.0 ], "normalized_solution": [ 84, 360, 251, 1000 ] }, { "height": 333, "width": 500, "id": 127, "original_id": 538268, "dataset_name": "refcoco", "area": 11555.38805, "iscrowd": 0, "image_id": 127, "category_id": 1, "bbox_list": [ [ 42.46, 120.08, 124.9, 332.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581227.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left player.", "normal_caption": "left player", "solution": [ 42.46, 120.08, 125.9, 333.0 ], "normalized_solution": [ 84, 360, 251, 1000 ] }, { "height": 333, "width": 500, "id": 128, "original_id": 534500, "dataset_name": "refcoco", "area": 27238.905450000006, "iscrowd": 0, "image_id": 128, "category_id": 1, "bbox_list": [ [ 263.09, 13.34, 425.96, 328.04999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581227.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right girl.", "normal_caption": "right girl", "solution": [ 263.09, 13.34, 426.96, 329.05 ], "normalized_solution": [ 526, 40, 853, 988 ] }, { "height": 333, "width": 500, "id": 129, "original_id": 534500, "dataset_name": "refcoco", "area": 27238.905450000006, "iscrowd": 0, "image_id": 129, "category_id": 1, "bbox_list": [ [ 263.09, 13.34, 425.96, 328.04999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581227.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl closest to us.", "normal_caption": "girl closest to us", "solution": [ 263.09, 13.34, 426.96, 329.05 ], "normalized_solution": [ 526, 40, 853, 988 ] }, { "height": 333, "width": 500, "id": 130, "original_id": 534500, "dataset_name": "refcoco", "area": 27238.905450000006, "iscrowd": 0, "image_id": 130, "category_id": 1, "bbox_list": [ [ 263.09, 13.34, 425.96, 328.04999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581227.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in front cam.", "normal_caption": "girl in front cam", "solution": [ 263.09, 13.34, 426.96, 329.05 ], "normalized_solution": [ 526, 40, 853, 988 ] }, { "height": 480, "width": 640, "id": 131, "original_id": 1074443, "dataset_name": "refcoco", "area": 71222.46115000002, "iscrowd": 0, "image_id": 131, "category_id": 59, "bbox_list": [ [ 0.0, 327.91, 639.0, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pizza up front.", "normal_caption": "pizza up front", "solution": [ 0.0, 327.91, 640.0, 474.61 ], "normalized_solution": [ 0, 683, 1000, 988 ] }, { "height": 480, "width": 640, "id": 132, "original_id": 1074443, "dataset_name": "refcoco", "area": 71222.46115000002, "iscrowd": 0, "image_id": 132, "category_id": 59, "bbox_list": [ [ 0.0, 327.91, 639.0, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: click on the food in the foreground.", "normal_caption": "click on the food in the foreground", "solution": [ 0.0, 327.91, 640.0, 474.61 ], "normalized_solution": [ 0, 683, 1000, 988 ] }, { "height": 480, "width": 640, "id": 133, "original_id": 1074443, "dataset_name": "refcoco", "area": 71222.46115000002, "iscrowd": 0, "image_id": 133, "category_id": 59, "bbox_list": [ [ 0.0, 327.91, 639.0, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pizzzza.", "normal_caption": "pizzzza", "solution": [ 0.0, 327.91, 640.0, 474.61 ], "normalized_solution": [ 0, 683, 1000, 988 ] }, { "height": 480, "width": 640, "id": 134, "original_id": 1073591, "dataset_name": "refcoco", "area": 10395.064899999998, "iscrowd": 0, "image_id": 134, "category_id": 59, "bbox_list": [ [ 357.47, 317.7, 638.3800000000001, 376.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pizza back right.", "normal_caption": "pizza back right", "solution": [ 357.47, 317.7, 639.38, 377.8 ], "normalized_solution": [ 558, 661, 999, 787 ] }, { "height": 480, "width": 640, "id": 135, "original_id": 1073591, "dataset_name": "refcoco", "area": 10395.064899999998, "iscrowd": 0, "image_id": 135, "category_id": 59, "bbox_list": [ [ 357.47, 317.7, 638.3800000000001, 376.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pizza on right.", "normal_caption": "pizza on right", "solution": [ 357.47, 317.7, 639.38, 377.8 ], "normalized_solution": [ 558, 661, 999, 787 ] }, { "height": 480, "width": 640, "id": 136, "original_id": 1073591, "dataset_name": "refcoco", "area": 10395.064899999998, "iscrowd": 0, "image_id": 136, "category_id": 59, "bbox_list": [ [ 357.47, 317.7, 638.3800000000001, 376.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pizza in back.", "normal_caption": "pizza in back", "solution": [ 357.47, 317.7, 639.38, 377.8 ], "normalized_solution": [ 558, 661, 999, 787 ] }, { "height": 480, "width": 640, "id": 137, "original_id": 464938, "dataset_name": "refcoco", "area": 18074.825250000005, "iscrowd": 0, "image_id": 137, "category_id": 1, "bbox_list": [ [ 371.76, 100.24, 530.28, 325.58 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: plaid.", "normal_caption": "plaid", "solution": [ 371.76, 100.24, 531.28, 326.58 ], "normalized_solution": [ 580, 208, 830, 680 ] }, { "height": 480, "width": 640, "id": 138, "original_id": 464938, "dataset_name": "refcoco", "area": 18074.825250000005, "iscrowd": 0, "image_id": 138, "category_id": 1, "bbox_list": [ [ 371.76, 100.24, 530.28, 325.58 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: plaid shirt on right.", "normal_caption": "plaid shirt on right", "solution": [ 371.76, 100.24, 531.28, 326.58 ], "normalized_solution": [ 580, 208, 830, 680 ] }, { "height": 480, "width": 640, "id": 139, "original_id": 464938, "dataset_name": "refcoco", "area": 18074.825250000005, "iscrowd": 0, "image_id": 139, "category_id": 1, "bbox_list": [ [ 371.76, 100.24, 530.28, 325.58 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: plaid shirt.", "normal_caption": "plaid shirt", "solution": [ 371.76, 100.24, 531.28, 326.58 ], "normalized_solution": [ 580, 208, 830, 680 ] }, { "height": 480, "width": 640, "id": 140, "original_id": 445980, "dataset_name": "refcoco", "area": 82007.5595, "iscrowd": 0, "image_id": 140, "category_id": 1, "bbox_list": [ [ 1.08, 1.08, 377.60999999999996, 343.09 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on the left.", "normal_caption": "person on the left", "solution": [ 1.08, 1.08, 378.61, 344.09 ], "normalized_solution": [ 1, 2, 591, 716 ] }, { "height": 480, "width": 640, "id": 141, "original_id": 445980, "dataset_name": "refcoco", "area": 82007.5595, "iscrowd": 0, "image_id": 141, "category_id": 1, "bbox_list": [ [ 1.08, 1.08, 377.60999999999996, 343.09 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person in white.", "normal_caption": "person in white", "solution": [ 1.08, 1.08, 378.61, 344.09 ], "normalized_solution": [ 1, 2, 591, 716 ] }, { "height": 480, "width": 640, "id": 142, "original_id": 445980, "dataset_name": "refcoco", "area": 82007.5595, "iscrowd": 0, "image_id": 142, "category_id": 1, "bbox_list": [ [ 1.08, 1.08, 377.60999999999996, 343.09 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581199.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on left side.", "normal_caption": "person on left side", "solution": [ 1.08, 1.08, 378.61, 344.09 ], "normalized_solution": [ 1, 2, 591, 716 ] }, { "height": 425, "width": 640, "id": 143, "original_id": 516597, "dataset_name": "refcoco", "area": 21478.795700000002, "iscrowd": 0, "image_id": 143, "category_id": 1, "bbox_list": [ [ 0.0, 0.96, 126.98, 223.44 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: straps.", "normal_caption": "straps", "solution": [ 0.0, 0.96, 127.98, 224.44 ], "normalized_solution": [ 0, 2, 199, 528 ] }, { "height": 425, "width": 640, "id": 144, "original_id": 516597, "dataset_name": "refcoco", "area": 21478.795700000002, "iscrowd": 0, "image_id": 144, "category_id": 1, "bbox_list": [ [ 0.0, 0.96, 126.98, 223.44 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left corner of pic.", "normal_caption": "top left corner of pic", "solution": [ 0.0, 0.96, 127.98, 224.44 ], "normalized_solution": [ 0, 2, 199, 528 ] }, { "height": 425, "width": 640, "id": 145, "original_id": 516597, "dataset_name": "refcoco", "area": 21478.795700000002, "iscrowd": 0, "image_id": 145, "category_id": 1, "bbox_list": [ [ 0.0, 0.96, 126.98, 223.44 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left corner.", "normal_caption": "top left corner", "solution": [ 0.0, 0.96, 127.98, 224.44 ], "normalized_solution": [ 0, 2, 199, 528 ] }, { "height": 425, "width": 640, "id": 146, "original_id": 484402, "dataset_name": "refcoco", "area": 15355.57799999999, "iscrowd": 0, "image_id": 146, "category_id": 1, "bbox_list": [ [ 502.18, 0.0, 624.29, 241.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person in background in striped shirt.", "normal_caption": "person in background in striped shirt", "solution": [ 502.18, 0.0, 625.29, 242.53 ], "normalized_solution": [ 784, 0, 977, 570 ] }, { "height": 425, "width": 640, "id": 147, "original_id": 484402, "dataset_name": "refcoco", "area": 15355.57799999999, "iscrowd": 0, "image_id": 147, "category_id": 1, "bbox_list": [ [ 502.18, 0.0, 624.29, 241.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: strip shirt boy top right.", "normal_caption": "strip shirt boy top right", "solution": [ 502.18, 0.0, 625.29, 242.53 ], "normalized_solution": [ 784, 0, 977, 570 ] }, { "height": 425, "width": 640, "id": 148, "original_id": 484402, "dataset_name": "refcoco", "area": 15355.57799999999, "iscrowd": 0, "image_id": 148, "category_id": 1, "bbox_list": [ [ 502.18, 0.0, 624.29, 241.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: striped shirt.", "normal_caption": "striped shirt", "solution": [ 502.18, 0.0, 625.29, 242.53 ], "normalized_solution": [ 784, 0, 977, 570 ] }, { "height": 425, "width": 640, "id": 149, "original_id": 2163529, "dataset_name": "refcoco", "area": 74406.8812, "iscrowd": 0, "image_id": 149, "category_id": 1, "bbox_list": [ [ 229.67, 28.95, 600.85, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman looking at you.", "normal_caption": "woman looking at you", "solution": [ 229.67, 28.95, 601.85, 425.0 ], "normalized_solution": [ 358, 68, 940, 1000 ] }, { "height": 425, "width": 640, "id": 150, "original_id": 2163529, "dataset_name": "refcoco", "area": 74406.8812, "iscrowd": 0, "image_id": 150, "category_id": 1, "bbox_list": [ [ 229.67, 28.95, 600.85, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the girl looking at cam.", "normal_caption": "the girl looking at cam", "solution": [ 229.67, 28.95, 601.85, 425.0 ], "normalized_solution": [ 358, 68, 940, 1000 ] }, { "height": 425, "width": 640, "id": 151, "original_id": 2163529, "dataset_name": "refcoco", "area": 74406.8812, "iscrowd": 0, "image_id": 151, "category_id": 1, "bbox_list": [ [ 229.67, 28.95, 600.85, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl looking at you.", "normal_caption": "girl looking at you", "solution": [ 229.67, 28.95, 601.85, 425.0 ], "normalized_solution": [ 358, 68, 940, 1000 ] }, { "height": 425, "width": 640, "id": 152, "original_id": 1757650, "dataset_name": "refcoco", "area": 15704.0492, "iscrowd": 0, "image_id": 152, "category_id": 1, "bbox_list": [ [ 215.1, 308.62, 377.84000000000003, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: head of person woman looking at bottom.", "normal_caption": "head of person woman looking at bottom", "solution": [ 215.1, 308.62, 378.84, 425.0 ], "normalized_solution": [ 336, 726, 591, 1000 ] }, { "height": 425, "width": 640, "id": 153, "original_id": 1757650, "dataset_name": "refcoco", "area": 15704.0492, "iscrowd": 0, "image_id": 153, "category_id": 1, "bbox_list": [ [ 215.1, 308.62, 377.84000000000003, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blurred head left of the woman.", "normal_caption": "blurred head left of the woman", "solution": [ 215.1, 308.62, 378.84, 425.0 ], "normalized_solution": [ 336, 726, 591, 1000 ] }, { "height": 425, "width": 640, "id": 154, "original_id": 1757650, "dataset_name": "refcoco", "area": 15704.0492, "iscrowd": 0, "image_id": 154, "category_id": 1, "bbox_list": [ [ 215.1, 308.62, 377.84000000000003, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581198.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top of head bottom middle.", "normal_caption": "top of head bottom middle", "solution": [ 215.1, 308.62, 378.84, 425.0 ], "normalized_solution": [ 336, 726, 591, 1000 ] }, { "height": 427, "width": 640, "id": 155, "original_id": 174739, "dataset_name": "refcoco", "area": 93564.44255, "iscrowd": 0, "image_id": 155, "category_id": 7, "bbox_list": [ [ 57.44, 97.65, 556.21, 388.65999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581196.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: train.", "normal_caption": "train", "solution": [ 57.44, 97.65, 557.21, 389.66 ], "normalized_solution": [ 89, 228, 870, 912 ] }, { "height": 427, "width": 640, "id": 156, "original_id": 174739, "dataset_name": "refcoco", "area": 93564.44255, "iscrowd": 0, "image_id": 156, "category_id": 7, "bbox_list": [ [ 57.44, 97.65, 556.21, 388.65999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581196.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: train.", "normal_caption": "train", "solution": [ 57.44, 97.65, 557.21, 389.66 ], "normalized_solution": [ 89, 228, 870, 912 ] }, { "height": 427, "width": 640, "id": 157, "original_id": 174739, "dataset_name": "refcoco", "area": 93564.44255, "iscrowd": 0, "image_id": 157, "category_id": 7, "bbox_list": [ [ 57.44, 97.65, 556.21, 388.65999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581196.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: train.", "normal_caption": "train", "solution": [ 57.44, 97.65, 557.21, 389.66 ], "normalized_solution": [ 89, 228, 870, 912 ] }, { "height": 495, "width": 640, "id": 158, "original_id": 1943799, "dataset_name": "refcoco", "area": 11619.683249999996, "iscrowd": 0, "image_id": 158, "category_id": 62, "bbox_list": [ [ 509.0, 215.86, 639.0, 371.94000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: striped chair by the piano.", "normal_caption": "striped chair by the piano", "solution": [ 509.0, 215.86, 640.0, 372.94 ], "normalized_solution": [ 795, 436, 1000, 753 ] }, { "height": 495, "width": 640, "id": 159, "original_id": 1943799, "dataset_name": "refcoco", "area": 11619.683249999996, "iscrowd": 0, "image_id": 159, "category_id": 62, "bbox_list": [ [ 509.0, 215.86, 639.0, 371.94000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right chair facing us.", "normal_caption": "right chair facing us", "solution": [ 509.0, 215.86, 640.0, 372.94 ], "normalized_solution": [ 795, 436, 1000, 753 ] }, { "height": 495, "width": 640, "id": 160, "original_id": 1943799, "dataset_name": "refcoco", "area": 11619.683249999996, "iscrowd": 0, "image_id": 160, "category_id": 62, "bbox_list": [ [ 509.0, 215.86, 639.0, 371.94000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right most chair kinda dark.", "normal_caption": "right most chair kinda dark", "solution": [ 509.0, 215.86, 640.0, 372.94 ], "normalized_solution": [ 795, 436, 1000, 753 ] }, { "height": 495, "width": 640, "id": 161, "original_id": 117142, "dataset_name": "refcoco", "area": 10424.89785, "iscrowd": 0, "image_id": 161, "category_id": 63, "bbox_list": [ [ 476.83, 402.93, 637.39, 494.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch arm bottom right.", "normal_caption": "couch arm bottom right", "solution": [ 476.83, 402.93, 638.39, 495.0 ], "normalized_solution": [ 745, 814, 997, 1000 ] }, { "height": 495, "width": 640, "id": 162, "original_id": 117142, "dataset_name": "refcoco", "area": 10424.89785, "iscrowd": 0, "image_id": 162, "category_id": 63, "bbox_list": [ [ 476.83, 402.93, 637.39, 494.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch.", "normal_caption": "couch", "solution": [ 476.83, 402.93, 638.39, 495.0 ], "normalized_solution": [ 745, 814, 997, 1000 ] }, { "height": 495, "width": 640, "id": 163, "original_id": 117142, "dataset_name": "refcoco", "area": 10424.89785, "iscrowd": 0, "image_id": 163, "category_id": 63, "bbox_list": [ [ 476.83, 402.93, 637.39, 494.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sofa on right cut off.", "normal_caption": "sofa on right cut off", "solution": [ 476.83, 402.93, 638.39, 495.0 ], "normalized_solution": [ 745, 814, 997, 1000 ] }, { "height": 495, "width": 640, "id": 164, "original_id": 1949970, "dataset_name": "refcoco", "area": 11993.873649999998, "iscrowd": 0, "image_id": 164, "category_id": 63, "bbox_list": [ [ 509.97, 215.46, 639.0, 366.34000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair on other side of table.", "normal_caption": "chair on other side of table", "solution": [ 509.97, 215.46, 640.0, 367.34 ], "normalized_solution": [ 796, 435, 1000, 742 ] }, { "height": 495, "width": 640, "id": 165, "original_id": 1949970, "dataset_name": "refcoco", "area": 11993.873649999998, "iscrowd": 0, "image_id": 165, "category_id": 63, "bbox_list": [ [ 509.97, 215.46, 639.0, 366.34000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: striped chair furthest right.", "normal_caption": "striped chair furthest right", "solution": [ 509.97, 215.46, 640.0, 367.34 ], "normalized_solution": [ 796, 435, 1000, 742 ] }, { "height": 495, "width": 640, "id": 166, "original_id": 113430, "dataset_name": "refcoco", "area": 42172.86925, "iscrowd": 0, "image_id": 166, "category_id": 63, "bbox_list": [ [ 167.13, 265.06, 448.23, 494.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch on the left.", "normal_caption": "couch on the left", "solution": [ 167.13, 265.06, 449.23, 495.0 ], "normalized_solution": [ 261, 535, 701, 1000 ] }, { "height": 495, "width": 640, "id": 167, "original_id": 113430, "dataset_name": "refcoco", "area": 42172.86925, "iscrowd": 0, "image_id": 167, "category_id": 63, "bbox_list": [ [ 167.13, 265.06, 448.23, 494.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: striped chair middle.", "normal_caption": "striped chair middle", "solution": [ 167.13, 265.06, 449.23, 495.0 ], "normalized_solution": [ 261, 535, 701, 1000 ] }, { "height": 495, "width": 640, "id": 168, "original_id": 113430, "dataset_name": "refcoco", "area": 42172.86925, "iscrowd": 0, "image_id": 168, "category_id": 63, "bbox_list": [ [ 167.13, 265.06, 448.23, 494.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair.", "normal_caption": "chair", "solution": [ 167.13, 265.06, 449.23, 495.0 ], "normalized_solution": [ 261, 535, 701, 1000 ] }, { "height": 495, "width": 640, "id": 169, "original_id": 103387, "dataset_name": "refcoco", "area": 40689.305100000005, "iscrowd": 0, "image_id": 169, "category_id": 62, "bbox_list": [ [ 169.26, 267.19, 448.23, 488.68 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair front center.", "normal_caption": "chair front center", "solution": [ 169.26, 267.19, 449.23, 489.68 ], "normalized_solution": [ 264, 539, 701, 989 ] }, { "height": 495, "width": 640, "id": 170, "original_id": 103387, "dataset_name": "refcoco", "area": 40689.305100000005, "iscrowd": 0, "image_id": 170, "category_id": 62, "bbox_list": [ [ 169.26, 267.19, 448.23, 488.68 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: striped couch.", "normal_caption": "striped couch", "solution": [ 169.26, 267.19, 449.23, 489.68 ], "normalized_solution": [ 264, 539, 701, 989 ] }, { "height": 495, "width": 640, "id": 171, "original_id": 103387, "dataset_name": "refcoco", "area": 40689.305100000005, "iscrowd": 0, "image_id": 171, "category_id": 62, "bbox_list": [ [ 169.26, 267.19, 448.23, 488.68 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: near chair.", "normal_caption": "near chair", "solution": [ 169.26, 267.19, 449.23, 489.68 ], "normalized_solution": [ 264, 539, 701, 989 ] }, { "height": 419, "width": 640, "id": 172, "original_id": 152760, "dataset_name": "refcoco", "area": 20540.955850000002, "iscrowd": 0, "image_id": 172, "category_id": 4, "bbox_list": [ [ 188.31, 194.97, 428.36, 365.33000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front center bike.", "normal_caption": "front center bike", "solution": [ 188.31, 194.97, 429.36, 366.33 ], "normalized_solution": [ 294, 465, 670, 874 ] }, { "height": 419, "width": 640, "id": 173, "original_id": 152760, "dataset_name": "refcoco", "area": 20540.955850000002, "iscrowd": 0, "image_id": 173, "category_id": 4, "bbox_list": [ [ 188.31, 194.97, 428.36, 365.33000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: motorcycle nearest to us.", "normal_caption": "motorcycle nearest to us", "solution": [ 188.31, 194.97, 429.36, 366.33 ], "normalized_solution": [ 294, 465, 670, 874 ] }, { "height": 419, "width": 640, "id": 174, "original_id": 152760, "dataset_name": "refcoco", "area": 20540.955850000002, "iscrowd": 0, "image_id": 174, "category_id": 4, "bbox_list": [ [ 188.31, 194.97, 428.36, 365.33000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle bike.", "normal_caption": "middle bike", "solution": [ 188.31, 194.97, 429.36, 366.33 ], "normalized_solution": [ 294, 465, 670, 874 ] }, { "height": 426, "width": 640, "id": 175, "original_id": 1791082, "dataset_name": "refcoco", "area": 81908.57584999996, "iscrowd": 0, "image_id": 175, "category_id": 4, "bbox_list": [ [ 77.57, 62.69, 514.46, 413.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: main bike.", "normal_caption": "main bike", "solution": [ 77.57, 62.69, 515.46, 414.53 ], "normalized_solution": [ 121, 147, 805, 973 ] }, { "height": 426, "width": 640, "id": 176, "original_id": 1791082, "dataset_name": "refcoco", "area": 81908.57584999996, "iscrowd": 0, "image_id": 176, "category_id": 4, "bbox_list": [ [ 77.57, 62.69, 514.46, 413.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: 13.", "normal_caption": "13", "solution": [ 77.57, 62.69, 515.46, 414.53 ], "normalized_solution": [ 121, 147, 805, 973 ] }, { "height": 426, "width": 640, "id": 177, "original_id": 1791082, "dataset_name": "refcoco", "area": 81908.57584999996, "iscrowd": 0, "image_id": 177, "category_id": 4, "bbox_list": [ [ 77.57, 62.69, 514.46, 413.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: main bike.", "normal_caption": "main bike", "solution": [ 77.57, 62.69, 515.46, 414.53 ], "normalized_solution": [ 121, 147, 805, 973 ] }, { "height": 426, "width": 640, "id": 178, "original_id": 246698, "dataset_name": "refcoco", "area": 13749.793800000003, "iscrowd": 0, "image_id": 178, "category_id": 4, "bbox_list": [ [ 0.0, 128.12, 133.02, 418.14 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far left front cycle.", "normal_caption": "far left front cycle", "solution": [ 0.0, 128.12, 134.02, 419.14 ], "normalized_solution": [ 0, 300, 209, 983 ] }, { "height": 426, "width": 640, "id": 179, "original_id": 246698, "dataset_name": "refcoco", "area": 13749.793800000003, "iscrowd": 0, "image_id": 179, "category_id": 4, "bbox_list": [ [ 0.0, 128.12, 133.02, 418.14 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: half bike far left.", "normal_caption": "half bike far left", "solution": [ 0.0, 128.12, 134.02, 419.14 ], "normalized_solution": [ 0, 300, 209, 983 ] }, { "height": 426, "width": 640, "id": 180, "original_id": 246698, "dataset_name": "refcoco", "area": 13749.793800000003, "iscrowd": 0, "image_id": 180, "category_id": 4, "bbox_list": [ [ 0.0, 128.12, 133.02, 418.14 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left corner.", "normal_caption": "bottom left corner", "solution": [ 0.0, 128.12, 134.02, 419.14 ], "normalized_solution": [ 0, 300, 209, 983 ] }, { "height": 426, "width": 640, "id": 181, "original_id": 245539, "dataset_name": "refcoco", "area": 17466.63315, "iscrowd": 0, "image_id": 181, "category_id": 4, "bbox_list": [ [ 367.6, 7.5, 510.20000000000005, 191.26 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: tire on blue motorcycle.", "normal_caption": "tire on blue motorcycle", "solution": [ 367.6, 7.5, 511.2, 192.26 ], "normalized_solution": [ 574, 17, 798, 451 ] }, { "height": 426, "width": 640, "id": 182, "original_id": 245539, "dataset_name": "refcoco", "area": 17466.63315, "iscrowd": 0, "image_id": 182, "category_id": 4, "bbox_list": [ [ 367.6, 7.5, 510.20000000000005, 191.26 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right bike in between white shirt and black shirt.", "normal_caption": "right bike in between white shirt and black shirt", "solution": [ 367.6, 7.5, 511.2, 192.26 ], "normalized_solution": [ 574, 17, 798, 451 ] }, { "height": 426, "width": 640, "id": 183, "original_id": 245539, "dataset_name": "refcoco", "area": 17466.63315, "iscrowd": 0, "image_id": 183, "category_id": 4, "bbox_list": [ [ 367.6, 7.5, 510.20000000000005, 191.26 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: on the back carrying.", "normal_caption": "on the back carrying", "solution": [ 367.6, 7.5, 511.2, 192.26 ], "normalized_solution": [ 574, 17, 798, 451 ] }, { "height": 426, "width": 640, "id": 184, "original_id": 215446, "dataset_name": "refcoco", "area": 23617.840750000003, "iscrowd": 0, "image_id": 184, "category_id": 1, "bbox_list": [ [ 437.57, 0.0, 639.0, 348.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right top white shirt.", "normal_caption": "right top white shirt", "solution": [ 437.57, 0.0, 640.0, 349.65 ], "normalized_solution": [ 683, 0, 1000, 820 ] }, { "height": 426, "width": 640, "id": 185, "original_id": 215446, "dataset_name": "refcoco", "area": 23617.840750000003, "iscrowd": 0, "image_id": 185, "category_id": 1, "bbox_list": [ [ 437.57, 0.0, 639.0, 348.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right top white shirt.", "normal_caption": "right top white shirt", "solution": [ 437.57, 0.0, 640.0, 349.65 ], "normalized_solution": [ 683, 0, 1000, 820 ] }, { "height": 426, "width": 640, "id": 186, "original_id": 215446, "dataset_name": "refcoco", "area": 23617.840750000003, "iscrowd": 0, "image_id": 186, "category_id": 1, "bbox_list": [ [ 437.57, 0.0, 639.0, 348.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in white.", "normal_caption": "man in white", "solution": [ 437.57, 0.0, 640.0, 349.65 ], "normalized_solution": [ 683, 0, 1000, 820 ] }, { "height": 426, "width": 640, "id": 187, "original_id": 202407, "dataset_name": "refcoco", "area": 30207.633699999995, "iscrowd": 0, "image_id": 187, "category_id": 1, "bbox_list": [ [ 543.05, 24.47, 638.9599999999999, 421.64 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right dark guy.", "normal_caption": "right dark guy", "solution": [ 543.05, 24.47, 639.96, 422.64 ], "normalized_solution": [ 848, 57, 999, 992 ] }, { "height": 426, "width": 640, "id": 188, "original_id": 202407, "dataset_name": "refcoco", "area": 30207.633699999995, "iscrowd": 0, "image_id": 188, "category_id": 1, "bbox_list": [ [ 543.05, 24.47, 638.9599999999999, 421.64 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black shape far right.", "normal_caption": "black shape far right", "solution": [ 543.05, 24.47, 639.96, 422.64 ], "normalized_solution": [ 848, 57, 999, 992 ] }, { "height": 426, "width": 640, "id": 189, "original_id": 202407, "dataset_name": "refcoco", "area": 30207.633699999995, "iscrowd": 0, "image_id": 189, "category_id": 1, "bbox_list": [ [ 543.05, 24.47, 638.9599999999999, 421.64 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581057.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black shirt right edge.", "normal_caption": "black shirt right edge", "solution": [ 543.05, 24.47, 639.96, 422.64 ], "normalized_solution": [ 848, 57, 999, 992 ] }, { "height": 427, "width": 640, "id": 190, "original_id": 591324, "dataset_name": "refcoco", "area": 33271.559799999995, "iscrowd": 0, "image_id": 190, "category_id": 24, "bbox_list": [ [ 149.94, 98.73, 439.18, 311.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581021.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: zebra closer to you.", "normal_caption": "zebra closer to you", "solution": [ 149.94, 98.73, 440.18, 312.16 ], "normalized_solution": [ 234, 231, 687, 731 ] }, { "height": 427, "width": 640, "id": 191, "original_id": 591324, "dataset_name": "refcoco", "area": 33271.559799999995, "iscrowd": 0, "image_id": 191, "category_id": 24, "bbox_list": [ [ 149.94, 98.73, 439.18, 311.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581021.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front zebra.", "normal_caption": "front zebra", "solution": [ 149.94, 98.73, 440.18, 312.16 ], "normalized_solution": [ 234, 231, 687, 731 ] }, { "height": 427, "width": 640, "id": 192, "original_id": 591324, "dataset_name": "refcoco", "area": 33271.559799999995, "iscrowd": 0, "image_id": 192, "category_id": 24, "bbox_list": [ [ 149.94, 98.73, 439.18, 311.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581021.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: zebra in the front.", "normal_caption": "zebra in the front", "solution": [ 149.94, 98.73, 440.18, 312.16 ], "normalized_solution": [ 234, 231, 687, 731 ] }, { "height": 427, "width": 640, "id": 193, "original_id": 589140, "dataset_name": "refcoco", "area": 16018.6149, "iscrowd": 0, "image_id": 193, "category_id": 24, "bbox_list": [ [ 344.77, 109.55, 564.53, 290.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581021.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: zebra on the right.", "normal_caption": "zebra on the right", "solution": [ 344.77, 109.55, 565.53, 291.85 ], "normalized_solution": [ 538, 256, 883, 683 ] }, { "height": 427, "width": 640, "id": 194, "original_id": 589140, "dataset_name": "refcoco", "area": 16018.6149, "iscrowd": 0, "image_id": 194, "category_id": 24, "bbox_list": [ [ 344.77, 109.55, 564.53, 290.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581021.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right zebra.", "normal_caption": "right zebra", "solution": [ 344.77, 109.55, 565.53, 291.85 ], "normalized_solution": [ 538, 256, 883, 683 ] }, { "height": 427, "width": 640, "id": 195, "original_id": 589140, "dataset_name": "refcoco", "area": 16018.6149, "iscrowd": 0, "image_id": 195, "category_id": 24, "bbox_list": [ [ 344.77, 109.55, 564.53, 290.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581021.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right zebra.", "normal_caption": "right zebra", "solution": [ 344.77, 109.55, 565.53, 291.85 ], "normalized_solution": [ 538, 256, 883, 683 ] }, { "height": 375, "width": 500, "id": 196, "original_id": 528547, "dataset_name": "refcoco", "area": 10754.266749999999, "iscrowd": 0, "image_id": 196, "category_id": 1, "bbox_list": [ [ 135.98, 45.61, 256.6, 285.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 135.98, 45.61, 257.6, 286.32 ], "normalized_solution": [ 271, 121, 515, 763 ] }, { "height": 375, "width": 500, "id": 197, "original_id": 528547, "dataset_name": "refcoco", "area": 10754.266749999999, "iscrowd": 0, "image_id": 197, "category_id": 1, "bbox_list": [ [ 135.98, 45.61, 256.6, 285.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl on skateboard.", "normal_caption": "girl on skateboard", "solution": [ 135.98, 45.61, 257.6, 286.32 ], "normalized_solution": [ 271, 121, 515, 763 ] }, { "height": 375, "width": 500, "id": 198, "original_id": 528547, "dataset_name": "refcoco", "area": 10754.266749999999, "iscrowd": 0, "image_id": 198, "category_id": 1, "bbox_list": [ [ 135.98, 45.61, 256.6, 285.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink shirt.", "normal_caption": "pink shirt", "solution": [ 135.98, 45.61, 257.6, 286.32 ], "normalized_solution": [ 271, 121, 515, 763 ] }, { "height": 375, "width": 500, "id": 199, "original_id": 489887, "dataset_name": "refcoco", "area": 12464.597600000003, "iscrowd": 0, "image_id": 199, "category_id": 1, "bbox_list": [ [ 44.64, 26.56, 159.19, 286.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on left.", "normal_caption": "man on left", "solution": [ 44.64, 26.56, 160.19, 287.18 ], "normalized_solution": [ 89, 70, 320, 765 ] }, { "height": 375, "width": 500, "id": 200, "original_id": 489887, "dataset_name": "refcoco", "area": 12464.597600000003, "iscrowd": 0, "image_id": 200, "category_id": 1, "bbox_list": [ [ 44.64, 26.56, 159.19, 286.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy.", "normal_caption": "boy", "solution": [ 44.64, 26.56, 160.19, 287.18 ], "normalized_solution": [ 89, 70, 320, 765 ] }, { "height": 375, "width": 500, "id": 201, "original_id": 489887, "dataset_name": "refcoco", "area": 12464.597600000003, "iscrowd": 0, "image_id": 201, "category_id": 1, "bbox_list": [ [ 44.64, 26.56, 159.19, 286.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000581009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in white.", "normal_caption": "man in white", "solution": [ 44.64, 26.56, 160.19, 287.18 ], "normalized_solution": [ 89, 70, 320, 765 ] }, { "height": 427, "width": 640, "id": 202, "original_id": 480045, "dataset_name": "refcoco", "area": 14907.269749999992, "iscrowd": 0, "image_id": 202, "category_id": 1, "bbox_list": [ [ 95.64, 115.77, 233.92000000000002, 329.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in scarf.", "normal_caption": "woman in scarf", "solution": [ 95.64, 115.77, 234.92, 330.25 ], "normalized_solution": [ 149, 271, 367, 773 ] }, { "height": 427, "width": 640, "id": 203, "original_id": 480045, "dataset_name": "refcoco", "area": 14907.269749999992, "iscrowd": 0, "image_id": 203, "category_id": 1, "bbox_list": [ [ 95.64, 115.77, 233.92000000000002, 329.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on the left white scard.", "normal_caption": "woman on the left white scard", "solution": [ 95.64, 115.77, 234.92, 330.25 ], "normalized_solution": [ 149, 271, 367, 773 ] }, { "height": 427, "width": 640, "id": 204, "original_id": 480045, "dataset_name": "refcoco", "area": 14907.269749999992, "iscrowd": 0, "image_id": 204, "category_id": 1, "bbox_list": [ [ 95.64, 115.77, 233.92000000000002, 329.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman with scarf.", "normal_caption": "woman with scarf", "solution": [ 95.64, 115.77, 234.92, 330.25 ], "normalized_solution": [ 149, 271, 367, 773 ] }, { "height": 427, "width": 640, "id": 205, "original_id": 460124, "dataset_name": "refcoco", "area": 21105.55065000001, "iscrowd": 0, "image_id": 205, "category_id": 1, "bbox_list": [ [ 454.7, 98.48, 571.2, 425.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady on the right.", "normal_caption": "lady on the right", "solution": [ 454.7, 98.48, 572.2, 426.22 ], "normalized_solution": [ 710, 230, 894, 998 ] }, { "height": 427, "width": 640, "id": 206, "original_id": 460124, "dataset_name": "refcoco", "area": 21105.55065000001, "iscrowd": 0, "image_id": 206, "category_id": 1, "bbox_list": [ [ 454.7, 98.48, 571.2, 425.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman next to man.", "normal_caption": "woman next to man", "solution": [ 454.7, 98.48, 572.2, 426.22 ], "normalized_solution": [ 710, 230, 894, 998 ] }, { "height": 427, "width": 640, "id": 207, "original_id": 460124, "dataset_name": "refcoco", "area": 21105.55065000001, "iscrowd": 0, "image_id": 207, "category_id": 1, "bbox_list": [ [ 454.7, 98.48, 571.2, 425.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady with glasses.", "normal_caption": "lady with glasses", "solution": [ 454.7, 98.48, 572.2, 426.22 ], "normalized_solution": [ 710, 230, 894, 998 ] }, { "height": 427, "width": 640, "id": 208, "original_id": 439008, "dataset_name": "refcoco", "area": 43051.94235000002, "iscrowd": 0, "image_id": 208, "category_id": 1, "bbox_list": [ [ 351.99, 74.05, 516.4, 425.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 351.99, 74.05, 517.4, 426.04 ], "normalized_solution": [ 549, 173, 808, 997 ] }, { "height": 427, "width": 640, "id": 209, "original_id": 439008, "dataset_name": "refcoco", "area": 43051.94235000002, "iscrowd": 0, "image_id": 209, "category_id": 1, "bbox_list": [ [ 351.99, 74.05, 516.4, 425.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in blue and red jacket.", "normal_caption": "man in blue and red jacket", "solution": [ 351.99, 74.05, 517.4, 426.04 ], "normalized_solution": [ 549, 173, 808, 997 ] }, { "height": 427, "width": 640, "id": 210, "original_id": 439008, "dataset_name": "refcoco", "area": 43051.94235000002, "iscrowd": 0, "image_id": 210, "category_id": 1, "bbox_list": [ [ 351.99, 74.05, 516.4, 425.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580945.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in blue jacket with red sleeves.", "normal_caption": "man in blue jacket with red sleeves", "solution": [ 351.99, 74.05, 517.4, 426.04 ], "normalized_solution": [ 549, 173, 808, 997 ] }, { "height": 640, "width": 597, "id": 211, "original_id": 1207959, "dataset_name": "refcoco", "area": 20363.782549999996, "iscrowd": 0, "image_id": 211, "category_id": 1, "bbox_list": [ [ 291.14, 219.99, 402.46999999999997, 588.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580919.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person with backpackdont click the bag click the person.", "normal_caption": "person with backpackdont click the bag click the person", "solution": [ 291.14, 219.99, 403.47, 589.81 ], "normalized_solution": [ 487, 343, 675, 921 ] }, { "height": 640, "width": 597, "id": 212, "original_id": 1207959, "dataset_name": "refcoco", "area": 20363.782549999996, "iscrowd": 0, "image_id": 212, "category_id": 1, "bbox_list": [ [ 291.14, 219.99, 402.46999999999997, 588.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580919.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: biege shorts.", "normal_caption": "biege shorts", "solution": [ 291.14, 219.99, 403.47, 589.81 ], "normalized_solution": [ 487, 343, 675, 921 ] }, { "height": 640, "width": 597, "id": 213, "original_id": 1207959, "dataset_name": "refcoco", "area": 20363.782549999996, "iscrowd": 0, "image_id": 213, "category_id": 1, "bbox_list": [ [ 291.14, 219.99, 402.46999999999997, 588.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580919.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man walking dog.", "normal_caption": "man walking dog", "solution": [ 291.14, 219.99, 403.47, 589.81 ], "normalized_solution": [ 487, 343, 675, 921 ] }, { "height": 427, "width": 640, "id": 214, "original_id": 2117621, "dataset_name": "refcoco", "area": 27308.349050000004, "iscrowd": 0, "image_id": 214, "category_id": 59, "bbox_list": [ [ 464.61, 237.97, 639.0, 420.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580913.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: food to right of pizza.", "normal_caption": "food to right of pizza", "solution": [ 464.61, 237.97, 640.0, 421.6 ], "normalized_solution": [ 725, 557, 1000, 987 ] }, { "height": 427, "width": 640, "id": 215, "original_id": 2117621, "dataset_name": "refcoco", "area": 27308.349050000004, "iscrowd": 0, "image_id": 215, "category_id": 59, "bbox_list": [ [ 464.61, 237.97, 639.0, 420.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580913.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: food towards right edge.", "normal_caption": "food towards right edge", "solution": [ 464.61, 237.97, 640.0, 421.6 ], "normalized_solution": [ 725, 557, 1000, 987 ] }, { "height": 427, "width": 640, "id": 216, "original_id": 2117621, "dataset_name": "refcoco", "area": 27308.349050000004, "iscrowd": 0, "image_id": 216, "category_id": 59, "bbox_list": [ [ 464.61, 237.97, 639.0, 420.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580913.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right slice.", "normal_caption": "right slice", "solution": [ 464.61, 237.97, 640.0, 421.6 ], "normalized_solution": [ 725, 557, 1000, 987 ] }, { "height": 427, "width": 640, "id": 217, "original_id": 1072388, "dataset_name": "refcoco", "area": 93212.6849, "iscrowd": 0, "image_id": 217, "category_id": 59, "bbox_list": [ [ 118.02, 0.0, 490.28999999999996, 421.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580913.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: food being held.", "normal_caption": "food being held", "solution": [ 118.02, 0.0, 491.29, 422.2 ], "normalized_solution": [ 184, 0, 767, 988 ] }, { "height": 427, "width": 640, "id": 218, "original_id": 1072388, "dataset_name": "refcoco", "area": 93212.6849, "iscrowd": 0, "image_id": 218, "category_id": 59, "bbox_list": [ [ 118.02, 0.0, 490.28999999999996, 421.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580913.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: food in hand.", "normal_caption": "food in hand", "solution": [ 118.02, 0.0, 491.29, 422.2 ], "normalized_solution": [ 184, 0, 767, 988 ] }, { "height": 427, "width": 640, "id": 219, "original_id": 1072388, "dataset_name": "refcoco", "area": 93212.6849, "iscrowd": 0, "image_id": 219, "category_id": 59, "bbox_list": [ [ 118.02, 0.0, 490.28999999999996, 421.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580913.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bread slice.", "normal_caption": "bread slice", "solution": [ 118.02, 0.0, 491.29, 422.2 ], "normalized_solution": [ 184, 0, 767, 988 ] }, { "height": 640, "width": 480, "id": 220, "original_id": 343754, "dataset_name": "refcoco", "area": 11753.676849999996, "iscrowd": 0, "image_id": 220, "category_id": 90, "bbox_list": [ [ 336.22, 82.11, 479.0, 415.7 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right toothbrush.", "normal_caption": "far right toothbrush", "solution": [ 336.22, 82.11, 480.0, 416.7 ], "normalized_solution": [ 700, 128, 1000, 651 ] }, { "height": 640, "width": 480, "id": 221, "original_id": 343754, "dataset_name": "refcoco", "area": 11753.676849999996, "iscrowd": 0, "image_id": 221, "category_id": 90, "bbox_list": [ [ 336.22, 82.11, 479.0, 415.7 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the furthest toothbrush to the right.", "normal_caption": "the furthest toothbrush to the right", "solution": [ 336.22, 82.11, 480.0, 416.7 ], "normalized_solution": [ 700, 128, 1000, 651 ] }, { "height": 640, "width": 480, "id": 222, "original_id": 343754, "dataset_name": "refcoco", "area": 11753.676849999996, "iscrowd": 0, "image_id": 222, "category_id": 90, "bbox_list": [ [ 336.22, 82.11, 479.0, 415.7 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: most right brush in the back.", "normal_caption": "most right brush in the back", "solution": [ 336.22, 82.11, 480.0, 416.7 ], "normalized_solution": [ 700, 128, 1000, 651 ] }, { "height": 640, "width": 480, "id": 223, "original_id": 343558, "dataset_name": "refcoco", "area": 18122.564799999996, "iscrowd": 0, "image_id": 223, "category_id": 90, "bbox_list": [ [ 280.79, 64.36, 425.19000000000005, 423.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: first toothbrush on the right.", "normal_caption": "first toothbrush on the right", "solution": [ 280.79, 64.36, 426.19, 424.06 ], "normalized_solution": [ 584, 100, 887, 662 ] }, { "height": 640, "width": 480, "id": 224, "original_id": 343558, "dataset_name": "refcoco", "area": 18122.564799999996, "iscrowd": 0, "image_id": 224, "category_id": 90, "bbox_list": [ [ 280.79, 64.36, 425.19000000000005, 423.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second from right brush.", "normal_caption": "second from right brush", "solution": [ 280.79, 64.36, 426.19, 424.06 ], "normalized_solution": [ 584, 100, 887, 662 ] }, { "height": 640, "width": 480, "id": 225, "original_id": 343558, "dataset_name": "refcoco", "area": 18122.564799999996, "iscrowd": 0, "image_id": 225, "category_id": 90, "bbox_list": [ [ 280.79, 64.36, 425.19000000000005, 423.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second brush from the right.", "normal_caption": "second brush from the right", "solution": [ 280.79, 64.36, 426.19, 424.06 ], "normalized_solution": [ 584, 100, 887, 662 ] }, { "height": 640, "width": 480, "id": 226, "original_id": 343179, "dataset_name": "refcoco", "area": 15988.592700000001, "iscrowd": 0, "image_id": 226, "category_id": 90, "bbox_list": [ [ 138.42, 93.42, 239.44, 424.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: toothbrush in center with yellow bristles.", "normal_caption": "toothbrush in center with yellow bristles", "solution": [ 138.42, 93.42, 240.44, 425.07 ], "normalized_solution": [ 288, 145, 500, 664 ] }, { "height": 640, "width": 480, "id": 227, "original_id": 343179, "dataset_name": "refcoco", "area": 15988.592700000001, "iscrowd": 0, "image_id": 227, "category_id": 90, "bbox_list": [ [ 138.42, 93.42, 239.44, 424.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle toothbrush.", "normal_caption": "middle toothbrush", "solution": [ 138.42, 93.42, 240.44, 425.07 ], "normalized_solution": [ 288, 145, 500, 664 ] }, { "height": 640, "width": 480, "id": 228, "original_id": 343179, "dataset_name": "refcoco", "area": 15988.592700000001, "iscrowd": 0, "image_id": 228, "category_id": 90, "bbox_list": [ [ 138.42, 93.42, 239.44, 424.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: yellow toothbrush.", "normal_caption": "yellow toothbrush", "solution": [ 138.42, 93.42, 240.44, 425.07 ], "normalized_solution": [ 288, 145, 500, 664 ] }, { "height": 640, "width": 480, "id": 229, "original_id": 342398, "dataset_name": "refcoco", "area": 18493.616649999993, "iscrowd": 0, "image_id": 229, "category_id": 90, "bbox_list": [ [ 21.57, 59.97, 191.72, 424.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: toothbrush second from left.", "normal_caption": "toothbrush second from left", "solution": [ 21.57, 59.97, 192.72, 425.27 ], "normalized_solution": [ 44, 93, 401, 664 ] }, { "height": 640, "width": 480, "id": 230, "original_id": 342398, "dataset_name": "refcoco", "area": 18493.616649999993, "iscrowd": 0, "image_id": 230, "category_id": 90, "bbox_list": [ [ 21.57, 59.97, 191.72, 424.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brush second from left.", "normal_caption": "brush second from left", "solution": [ 21.57, 59.97, 192.72, 425.27 ], "normalized_solution": [ 44, 93, 401, 664 ] }, { "height": 640, "width": 480, "id": 231, "original_id": 342398, "dataset_name": "refcoco", "area": 18493.616649999993, "iscrowd": 0, "image_id": 231, "category_id": 90, "bbox_list": [ [ 21.57, 59.97, 191.72, 424.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580851.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: toothbrush front left.", "normal_caption": "toothbrush front left", "solution": [ 21.57, 59.97, 192.72, 425.27 ], "normalized_solution": [ 44, 93, 401, 664 ] }, { "height": 429, "width": 640, "id": 232, "original_id": 2191253, "dataset_name": "refcoco", "area": 70079.11910000001, "iscrowd": 0, "image_id": 232, "category_id": 1, "bbox_list": [ [ 184.97, 0.0, 461.42999999999995, 421.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy wpurple tie.", "normal_caption": "boy wpurple tie", "solution": [ 184.97, 0.0, 462.43, 422.31 ], "normalized_solution": [ 289, 0, 722, 984 ] }, { "height": 429, "width": 640, "id": 233, "original_id": 2191253, "dataset_name": "refcoco", "area": 70079.11910000001, "iscrowd": 0, "image_id": 233, "category_id": 1, "bbox_list": [ [ 184.97, 0.0, 461.42999999999995, 421.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: purple tie.", "normal_caption": "purple tie", "solution": [ 184.97, 0.0, 462.43, 422.31 ], "normalized_solution": [ 289, 0, 722, 984 ] }, { "height": 429, "width": 640, "id": 234, "original_id": 2191253, "dataset_name": "refcoco", "area": 70079.11910000001, "iscrowd": 0, "image_id": 234, "category_id": 1, "bbox_list": [ [ 184.97, 0.0, 461.42999999999995, 421.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle kid purple tie.", "normal_caption": "middle kid purple tie", "solution": [ 184.97, 0.0, 462.43, 422.31 ], "normalized_solution": [ 289, 0, 722, 984 ] }, { "height": 429, "width": 640, "id": 235, "original_id": 2191061, "dataset_name": "refcoco", "area": 38066.69175, "iscrowd": 0, "image_id": 235, "category_id": 1, "bbox_list": [ [ 391.11, 35.66, 575.09, 415.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy with blue tie blond hair.", "normal_caption": "boy with blue tie blond hair", "solution": [ 391.11, 35.66, 576.09, 416.74 ], "normalized_solution": [ 611, 83, 900, 971 ] }, { "height": 429, "width": 640, "id": 236, "original_id": 2191061, "dataset_name": "refcoco", "area": 38066.69175, "iscrowd": 0, "image_id": 236, "category_id": 1, "bbox_list": [ [ 391.11, 35.66, 575.09, 415.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blondie boy with blue tie.", "normal_caption": "blondie boy with blue tie", "solution": [ 391.11, 35.66, 576.09, 416.74 ], "normalized_solution": [ 611, 83, 900, 971 ] }, { "height": 429, "width": 640, "id": 237, "original_id": 2158396, "dataset_name": "refcoco", "area": 37183.33295, "iscrowd": 0, "image_id": 237, "category_id": 1, "bbox_list": [ [ 459.09, 111.43, 639.0, 421.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blond hair close to us on right.", "normal_caption": "blond hair close to us on right", "solution": [ 459.09, 111.43, 640.0, 422.31 ], "normalized_solution": [ 717, 259, 1000, 984 ] }, { "height": 429, "width": 640, "id": 238, "original_id": 2158396, "dataset_name": "refcoco", "area": 37183.33295, "iscrowd": 0, "image_id": 238, "category_id": 1, "bbox_list": [ [ 459.09, 111.43, 639.0, 421.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hair in front.", "normal_caption": "hair in front", "solution": [ 459.09, 111.43, 640.0, 422.31 ], "normalized_solution": [ 717, 259, 1000, 984 ] }, { "height": 429, "width": 640, "id": 239, "original_id": 1729858, "dataset_name": "refcoco", "area": 10553.794749999997, "iscrowd": 0, "image_id": 239, "category_id": 1, "bbox_list": [ [ 77.39, 77.98, 187.45999999999998, 279.46 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: first boy from the left.", "normal_caption": "first boy from the left", "solution": [ 77.39, 77.98, 188.46, 280.46 ], "normalized_solution": [ 120, 181, 294, 653 ] }, { "height": 429, "width": 640, "id": 240, "original_id": 1729858, "dataset_name": "refcoco", "area": 10553.794749999997, "iscrowd": 0, "image_id": 240, "category_id": 1, "bbox_list": [ [ 77.39, 77.98, 187.45999999999998, 279.46 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left man.", "normal_caption": "left man", "solution": [ 77.39, 77.98, 188.46, 280.46 ], "normalized_solution": [ 120, 181, 294, 653 ] }, { "height": 429, "width": 640, "id": 241, "original_id": 539594, "dataset_name": "refcoco", "area": 33703.927899999995, "iscrowd": 0, "image_id": 241, "category_id": 1, "bbox_list": [ [ 85.22, 14.77, 286.61, 337.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl next to blazer guy.", "normal_caption": "girl next to blazer guy", "solution": [ 85.22, 14.77, 287.61, 338.21 ], "normalized_solution": [ 133, 34, 449, 788 ] }, { "height": 429, "width": 640, "id": 242, "original_id": 539594, "dataset_name": "refcoco", "area": 33703.927899999995, "iscrowd": 0, "image_id": 242, "category_id": 1, "bbox_list": [ [ 85.22, 14.77, 286.61, 337.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person with one rose.", "normal_caption": "person with one rose", "solution": [ 85.22, 14.77, 287.61, 338.21 ], "normalized_solution": [ 133, 34, 449, 788 ] }, { "height": 429, "width": 640, "id": 243, "original_id": 539594, "dataset_name": "refcoco", "area": 33703.927899999995, "iscrowd": 0, "image_id": 243, "category_id": 1, "bbox_list": [ [ 85.22, 14.77, 286.61, 337.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580849.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second girl from left.", "normal_caption": "second girl from left", "solution": [ 85.22, 14.77, 287.61, 338.21 ], "normalized_solution": [ 133, 34, 449, 788 ] }, { "height": 426, "width": 640, "id": 244, "original_id": 1938201, "dataset_name": "refcoco", "area": 64253.211000000025, "iscrowd": 0, "image_id": 244, "category_id": 62, "bbox_list": [ [ 402.84, 0.81, 639.0, 425.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580843.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lol right seat.", "normal_caption": "lol right seat", "solution": [ 402.84, 0.81, 640.0, 426.0 ], "normalized_solution": [ 629, 1, 1000, 1000 ] }, { "height": 426, "width": 640, "id": 245, "original_id": 1938201, "dataset_name": "refcoco", "area": 64253.211000000025, "iscrowd": 0, "image_id": 245, "category_id": 62, "bbox_list": [ [ 402.84, 0.81, 639.0, 425.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580843.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right seat.", "normal_caption": "right seat", "solution": [ 402.84, 0.81, 640.0, 426.0 ], "normalized_solution": [ 629, 1, 1000, 1000 ] }, { "height": 426, "width": 640, "id": 246, "original_id": 1938201, "dataset_name": "refcoco", "area": 64253.211000000025, "iscrowd": 0, "image_id": 246, "category_id": 62, "bbox_list": [ [ 402.84, 0.81, 639.0, 425.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580843.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: seat on right.", "normal_caption": "seat on right", "solution": [ 402.84, 0.81, 640.0, 426.0 ], "normalized_solution": [ 629, 1, 1000, 1000 ] }, { "height": 426, "width": 640, "id": 247, "original_id": 1600280, "dataset_name": "refcoco", "area": 18767.495000000003, "iscrowd": 0, "image_id": 247, "category_id": 62, "bbox_list": [ [ 34.46, 1.91, 373.31, 419.26000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580843.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue seat on left.", "normal_caption": "blue seat on left", "solution": [ 34.46, 1.91, 374.31, 420.26 ], "normalized_solution": [ 53, 4, 584, 986 ] }, { "height": 426, "width": 640, "id": 248, "original_id": 1600280, "dataset_name": "refcoco", "area": 18767.495000000003, "iscrowd": 0, "image_id": 248, "category_id": 62, "bbox_list": [ [ 34.46, 1.91, 373.31, 419.26000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580843.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: click the seat just above suitcase handle.", "normal_caption": "click the seat just above suitcase handle", "solution": [ 34.46, 1.91, 374.31, 420.26 ], "normalized_solution": [ 53, 4, 584, 986 ] }, { "height": 426, "width": 640, "id": 249, "original_id": 1600280, "dataset_name": "refcoco", "area": 18767.495000000003, "iscrowd": 0, "image_id": 249, "category_id": 62, "bbox_list": [ [ 34.46, 1.91, 373.31, 419.26000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580843.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the seat were the bag is.", "normal_caption": "the seat were the bag is", "solution": [ 34.46, 1.91, 374.31, 420.26 ], "normalized_solution": [ 53, 4, 584, 986 ] }, { "height": 480, "width": 640, "id": 250, "original_id": 2167429, "dataset_name": "refcoco", "area": 17023.7504, "iscrowd": 0, "image_id": 250, "category_id": 1, "bbox_list": [ [ 0.0, 141.43, 78.23, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: mans arm in far left.", "normal_caption": "mans arm in far left", "solution": [ 0.0, 141.43, 79.23, 480.0 ], "normalized_solution": [ 0, 294, 123, 1000 ] }, { "height": 480, "width": 640, "id": 251, "original_id": 2167429, "dataset_name": "refcoco", "area": 17023.7504, "iscrowd": 0, "image_id": 251, "category_id": 1, "bbox_list": [ [ 0.0, 141.43, 78.23, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far left partial person.", "normal_caption": "far left partial person", "solution": [ 0.0, 141.43, 79.23, 480.0 ], "normalized_solution": [ 0, 294, 123, 1000 ] }, { "height": 480, "width": 640, "id": 252, "original_id": 1709642, "dataset_name": "refcoco", "area": 62088.4215, "iscrowd": 0, "image_id": 252, "category_id": 1, "bbox_list": [ [ 26.97, 119.73, 309.65, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man with blue shirt.", "normal_caption": "man with blue shirt", "solution": [ 26.97, 119.73, 310.65, 474.61 ], "normalized_solution": [ 42, 249, 485, 988 ] }, { "height": 480, "width": 640, "id": 253, "original_id": 1709642, "dataset_name": "refcoco", "area": 62088.4215, "iscrowd": 0, "image_id": 253, "category_id": 1, "bbox_list": [ [ 26.97, 119.73, 309.65, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left tie guy.", "normal_caption": "left tie guy", "solution": [ 26.97, 119.73, 310.65, 474.61 ], "normalized_solution": [ 42, 249, 485, 988 ] }, { "height": 480, "width": 640, "id": 254, "original_id": 1709642, "dataset_name": "refcoco", "area": 62088.4215, "iscrowd": 0, "image_id": 254, "category_id": 1, "bbox_list": [ [ 26.97, 119.73, 309.65, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left male.", "normal_caption": "left male", "solution": [ 26.97, 119.73, 310.65, 474.61 ], "normalized_solution": [ 42, 249, 485, 988 ] }, { "height": 480, "width": 640, "id": 255, "original_id": 422824, "dataset_name": "refcoco", "area": 67823.18304999999, "iscrowd": 0, "image_id": 255, "category_id": 1, "bbox_list": [ [ 261.13, 133.0, 544.01, 471.14 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right guy.", "normal_caption": "right guy", "solution": [ 261.13, 133.0, 545.01, 472.14 ], "normalized_solution": [ 408, 277, 851, 983 ] }, { "height": 480, "width": 640, "id": 256, "original_id": 422824, "dataset_name": "refcoco", "area": 67823.18304999999, "iscrowd": 0, "image_id": 256, "category_id": 1, "bbox_list": [ [ 261.13, 133.0, 544.01, 471.14 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right guy facing camera.", "normal_caption": "right guy facing camera", "solution": [ 261.13, 133.0, 545.01, 472.14 ], "normalized_solution": [ 408, 277, 851, 983 ] }, { "height": 480, "width": 640, "id": 257, "original_id": 422824, "dataset_name": "refcoco", "area": 67823.18304999999, "iscrowd": 0, "image_id": 257, "category_id": 1, "bbox_list": [ [ 261.13, 133.0, 544.01, 471.14 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580837.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on right.", "normal_caption": "guy on right", "solution": [ 261.13, 133.0, 545.01, 472.14 ], "normalized_solution": [ 408, 277, 851, 983 ] }, { "height": 368, "width": 640, "id": 258, "original_id": 113265, "dataset_name": "refcoco", "area": 10071.0308, "iscrowd": 0, "image_id": 258, "category_id": 63, "bbox_list": [ [ 373.89, 141.9, 592.18, 299.62 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580741.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the couch the two are sitting on.", "normal_caption": "the couch the two are sitting on", "solution": [ 373.89, 141.9, 593.18, 300.62 ], "normalized_solution": [ 584, 385, 926, 816 ] }, { "height": 368, "width": 640, "id": 259, "original_id": 113265, "dataset_name": "refcoco", "area": 10071.0308, "iscrowd": 0, "image_id": 259, "category_id": 63, "bbox_list": [ [ 373.89, 141.9, 592.18, 299.62 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580741.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brown sofa at right where two goofy kids are sitting.", "normal_caption": "brown sofa at right where two goofy kids are sitting", "solution": [ 373.89, 141.9, 593.18, 300.62 ], "normalized_solution": [ 584, 385, 926, 816 ] }, { "height": 368, "width": 640, "id": 260, "original_id": 113265, "dataset_name": "refcoco", "area": 10071.0308, "iscrowd": 0, "image_id": 260, "category_id": 63, "bbox_list": [ [ 373.89, 141.9, 592.18, 299.62 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580741.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch right.", "normal_caption": "couch right", "solution": [ 373.89, 141.9, 593.18, 300.62 ], "normalized_solution": [ 584, 385, 926, 816 ] }, { "height": 368, "width": 640, "id": 261, "original_id": 99480, "dataset_name": "refcoco", "area": 14632.6631, "iscrowd": 0, "image_id": 261, "category_id": 63, "bbox_list": [ [ 0.0, 143.53, 296.11, 334.86 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580741.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch on left.", "normal_caption": "couch on left", "solution": [ 0.0, 143.53, 297.11, 335.86 ], "normalized_solution": [ 0, 390, 464, 912 ] }, { "height": 368, "width": 640, "id": 262, "original_id": 99480, "dataset_name": "refcoco", "area": 14632.6631, "iscrowd": 0, "image_id": 262, "category_id": 63, "bbox_list": [ [ 0.0, 143.53, 296.11, 334.86 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580741.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red couch.", "normal_caption": "red couch", "solution": [ 0.0, 143.53, 297.11, 335.86 ], "normalized_solution": [ 0, 390, 464, 912 ] }, { "height": 368, "width": 640, "id": 263, "original_id": 99480, "dataset_name": "refcoco", "area": 14632.6631, "iscrowd": 0, "image_id": 263, "category_id": 63, "bbox_list": [ [ 0.0, 143.53, 296.11, 334.86 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580741.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red couch on the left.", "normal_caption": "red couch on the left", "solution": [ 0.0, 143.53, 297.11, 335.86 ], "normalized_solution": [ 0, 390, 464, 912 ] }, { "height": 428, "width": 640, "id": 264, "original_id": 1058774, "dataset_name": "refcoco", "area": 20818.235299999997, "iscrowd": 0, "image_id": 264, "category_id": 56, "bbox_list": [ [ 461.23, 235.65, 639.0, 424.99 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: ummthe food in the bottom right corner i wouldnt eat it.", "normal_caption": "ummthe food in the bottom right corner i wouldnt eat it", "solution": [ 461.23, 235.65, 640.0, 425.99 ], "normalized_solution": [ 720, 550, 1000, 995 ] }, { "height": 428, "width": 640, "id": 265, "original_id": 1058774, "dataset_name": "refcoco", "area": 20818.235299999997, "iscrowd": 0, "image_id": 265, "category_id": 56, "bbox_list": [ [ 461.23, 235.65, 639.0, 424.99 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lower right hand corner of pic the piece of upside down broccoli.", "normal_caption": "lower right hand corner of pic the piece of upside down broccoli", "solution": [ 461.23, 235.65, 640.0, 425.99 ], "normalized_solution": [ 720, 550, 1000, 995 ] }, { "height": 428, "width": 640, "id": 266, "original_id": 1058774, "dataset_name": "refcoco", "area": 20818.235299999997, "iscrowd": 0, "image_id": 266, "category_id": 56, "bbox_list": [ [ 461.23, 235.65, 639.0, 424.99 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brocli on right.", "normal_caption": "brocli on right", "solution": [ 461.23, 235.65, 640.0, 425.99 ], "normalized_solution": [ 720, 550, 1000, 995 ] }, { "height": 428, "width": 640, "id": 267, "original_id": 1055111, "dataset_name": "refcoco", "area": 33027.766899999995, "iscrowd": 0, "image_id": 267, "category_id": 56, "bbox_list": [ [ 140.99, 243.59, 394.77, 415.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccoli near you.", "normal_caption": "broccoli near you", "solution": [ 140.99, 243.59, 395.77, 416.8 ], "normalized_solution": [ 220, 569, 618, 973 ] }, { "height": 428, "width": 640, "id": 268, "original_id": 1055111, "dataset_name": "refcoco", "area": 33027.766899999995, "iscrowd": 0, "image_id": 268, "category_id": 56, "bbox_list": [ [ 140.99, 243.59, 394.77, 415.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: piece of broccoli that is in the middle towards bottom of screen.", "normal_caption": "piece of broccoli that is in the middle towards bottom of screen", "solution": [ 140.99, 243.59, 395.77, 416.8 ], "normalized_solution": [ 220, 569, 618, 973 ] }, { "height": 428, "width": 640, "id": 269, "original_id": 1055111, "dataset_name": "refcoco", "area": 33027.766899999995, "iscrowd": 0, "image_id": 269, "category_id": 56, "bbox_list": [ [ 140.99, 243.59, 394.77, 415.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front broccoli.", "normal_caption": "front broccoli", "solution": [ 140.99, 243.59, 395.77, 416.8 ], "normalized_solution": [ 220, 569, 618, 973 ] }, { "height": 640, "width": 531, "id": 270, "original_id": 2205911, "dataset_name": "refcoco", "area": 51304.46600000001, "iscrowd": 0, "image_id": 270, "category_id": 1, "bbox_list": [ [ 263.24, 60.27, 508.96000000000004, 587.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580695.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right girl.", "normal_caption": "right girl", "solution": [ 263.24, 60.27, 509.96, 588.89 ], "normalized_solution": [ 495, 94, 960, 920 ] }, { "height": 640, "width": 531, "id": 271, "original_id": 2205911, "dataset_name": "refcoco", "area": 51304.46600000001, "iscrowd": 0, "image_id": 271, "category_id": 1, "bbox_list": [ [ 263.24, 60.27, 508.96000000000004, 587.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580695.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl right.", "normal_caption": "girl right", "solution": [ 263.24, 60.27, 509.96, 588.89 ], "normalized_solution": [ 495, 94, 960, 920 ] }, { "height": 640, "width": 531, "id": 272, "original_id": 2205911, "dataset_name": "refcoco", "area": 51304.46600000001, "iscrowd": 0, "image_id": 272, "category_id": 1, "bbox_list": [ [ 263.24, 60.27, 508.96000000000004, 587.89 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580695.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the girl in white.", "normal_caption": "the girl in white", "solution": [ 263.24, 60.27, 509.96, 588.89 ], "normalized_solution": [ 495, 94, 960, 920 ] }, { "height": 640, "width": 531, "id": 273, "original_id": 456832, "dataset_name": "refcoco", "area": 56095.65149999999, "iscrowd": 0, "image_id": 273, "category_id": 1, "bbox_list": [ [ 98.02, 9.8, 287.29, 575.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580695.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl wearing red.", "normal_caption": "girl wearing red", "solution": [ 98.02, 9.8, 288.29, 576.29 ], "normalized_solution": [ 184, 15, 542, 900 ] }, { "height": 640, "width": 531, "id": 274, "original_id": 456832, "dataset_name": "refcoco", "area": 56095.65149999999, "iscrowd": 0, "image_id": 274, "category_id": 1, "bbox_list": [ [ 98.02, 9.8, 287.29, 575.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580695.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: in red.", "normal_caption": "in red", "solution": [ 98.02, 9.8, 288.29, 576.29 ], "normalized_solution": [ 184, 15, 542, 900 ] }, { "height": 640, "width": 531, "id": 275, "original_id": 456832, "dataset_name": "refcoco", "area": 56095.65149999999, "iscrowd": 0, "image_id": 275, "category_id": 1, "bbox_list": [ [ 98.02, 9.8, 287.29, 575.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580695.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red shirt.", "normal_caption": "red shirt", "solution": [ 98.02, 9.8, 288.29, 576.29 ], "normalized_solution": [ 184, 15, 542, 900 ] }, { "height": 480, "width": 640, "id": 276, "original_id": 1088025, "dataset_name": "refcoco", "area": 16102.366600000003, "iscrowd": 0, "image_id": 276, "category_id": 61, "bbox_list": [ [ 389.39, 136.99, 517.8299999999999, 302.1 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white frosting pile on right.", "normal_caption": "white frosting pile on right", "solution": [ 389.39, 136.99, 518.83, 303.1 ], "normalized_solution": [ 608, 285, 810, 631 ] }, { "height": 480, "width": 640, "id": 277, "original_id": 1088025, "dataset_name": "refcoco", "area": 16102.366600000003, "iscrowd": 0, "image_id": 277, "category_id": 61, "bbox_list": [ [ 389.39, 136.99, 517.8299999999999, 302.1 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white object on plate.", "normal_caption": "white object on plate", "solution": [ 389.39, 136.99, 518.83, 303.1 ], "normalized_solution": [ 608, 285, 810, 631 ] }, { "height": 480, "width": 640, "id": 278, "original_id": 1088025, "dataset_name": "refcoco", "area": 16102.366600000003, "iscrowd": 0, "image_id": 278, "category_id": 61, "bbox_list": [ [ 389.39, 136.99, 517.8299999999999, 302.1 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cream puff.", "normal_caption": "cream puff", "solution": [ 389.39, 136.99, 518.83, 303.1 ], "normalized_solution": [ 608, 285, 810, 631 ] }, { "height": 480, "width": 640, "id": 279, "original_id": 1087576, "dataset_name": "refcoco", "area": 60926.53985, "iscrowd": 0, "image_id": 279, "category_id": 61, "bbox_list": [ [ 103.78, 54.59, 403.32000000000005, 319.53999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cake.", "normal_caption": "cake", "solution": [ 103.78, 54.59, 404.32, 320.54 ], "normalized_solution": [ 162, 113, 631, 667 ] }, { "height": 480, "width": 640, "id": 280, "original_id": 1087576, "dataset_name": "refcoco", "area": 60926.53985, "iscrowd": 0, "image_id": 280, "category_id": 61, "bbox_list": [ [ 103.78, 54.59, 403.32000000000005, 319.53999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cake.", "normal_caption": "cake", "solution": [ 103.78, 54.59, 404.32, 320.54 ], "normalized_solution": [ 162, 113, 631, 667 ] }, { "height": 480, "width": 640, "id": 281, "original_id": 1087576, "dataset_name": "refcoco", "area": 60926.53985, "iscrowd": 0, "image_id": 281, "category_id": 61, "bbox_list": [ [ 103.78, 54.59, 403.32000000000005, 319.53999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cake.", "normal_caption": "cake", "solution": [ 103.78, 54.59, 404.32, 320.54 ], "normalized_solution": [ 162, 113, 631, 667 ] }, { "height": 480, "width": 640, "id": 282, "original_id": 116158, "dataset_name": "refcoco", "area": 17302.73915, "iscrowd": 0, "image_id": 282, "category_id": 63, "bbox_list": [ [ 288.0, 155.87, 440.81, 282.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580625.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red chair.", "normal_caption": "red chair", "solution": [ 288.0, 155.87, 441.81, 283.87 ], "normalized_solution": [ 450, 324, 690, 591 ] }, { "height": 480, "width": 640, "id": 283, "original_id": 116158, "dataset_name": "refcoco", "area": 17302.73915, "iscrowd": 0, "image_id": 283, "category_id": 63, "bbox_list": [ [ 288.0, 155.87, 440.81, 282.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580625.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red chair.", "normal_caption": "red chair", "solution": [ 288.0, 155.87, 441.81, 283.87 ], "normalized_solution": [ 450, 324, 690, 591 ] }, { "height": 480, "width": 640, "id": 284, "original_id": 116158, "dataset_name": "refcoco", "area": 17302.73915, "iscrowd": 0, "image_id": 284, "category_id": 63, "bbox_list": [ [ 288.0, 155.87, 440.81, 282.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580625.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the single chair.", "normal_caption": "the single chair", "solution": [ 288.0, 155.87, 441.81, 283.87 ], "normalized_solution": [ 450, 324, 690, 591 ] }, { "height": 480, "width": 640, "id": 285, "original_id": 99191, "dataset_name": "refcoco", "area": 76168.20790000001, "iscrowd": 0, "image_id": 285, "category_id": 63, "bbox_list": [ [ 0.85, 186.71, 397.73, 472.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580625.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couchleft.", "normal_caption": "couchleft", "solution": [ 0.85, 186.71, 398.73, 473.87 ], "normalized_solution": [ 1, 388, 623, 987 ] }, { "height": 480, "width": 640, "id": 286, "original_id": 99191, "dataset_name": "refcoco", "area": 76168.20790000001, "iscrowd": 0, "image_id": 286, "category_id": 63, "bbox_list": [ [ 0.85, 186.71, 397.73, 472.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580625.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red couch.", "normal_caption": "red couch", "solution": [ 0.85, 186.71, 398.73, 473.87 ], "normalized_solution": [ 1, 388, 623, 987 ] }, { "height": 480, "width": 640, "id": 287, "original_id": 99191, "dataset_name": "refcoco", "area": 76168.20790000001, "iscrowd": 0, "image_id": 287, "category_id": 63, "bbox_list": [ [ 0.85, 186.71, 397.73, 472.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580625.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch.", "normal_caption": "couch", "solution": [ 0.85, 186.71, 398.73, 473.87 ], "normalized_solution": [ 1, 388, 623, 987 ] }, { "height": 640, "width": 427, "id": 288, "original_id": 2154747, "dataset_name": "refcoco", "area": 11594.40185, "iscrowd": 0, "image_id": 288, "category_id": 1, "bbox_list": [ [ 1.66, 1.66, 158.57999999999998, 153.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left guy in white.", "normal_caption": "left guy in white", "solution": [ 1.66, 1.66, 159.58, 154.6 ], "normalized_solution": [ 3, 2, 373, 241 ] }, { "height": 640, "width": 427, "id": 289, "original_id": 2154747, "dataset_name": "refcoco", "area": 11594.40185, "iscrowd": 0, "image_id": 289, "category_id": 1, "bbox_list": [ [ 1.66, 1.66, 158.57999999999998, 153.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man above green shirt guy.", "normal_caption": "man above green shirt guy", "solution": [ 1.66, 1.66, 159.58, 154.6 ], "normalized_solution": [ 3, 2, 373, 241 ] }, { "height": 640, "width": 427, "id": 290, "original_id": 2154747, "dataset_name": "refcoco", "area": 11594.40185, "iscrowd": 0, "image_id": 290, "category_id": 1, "bbox_list": [ [ 1.66, 1.66, 158.57999999999998, 153.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: upper left white shirt.", "normal_caption": "upper left white shirt", "solution": [ 1.66, 1.66, 159.58, 154.6 ], "normalized_solution": [ 3, 2, 373, 241 ] }, { "height": 640, "width": 427, "id": 291, "original_id": 535554, "dataset_name": "refcoco", "area": 16076.0192, "iscrowd": 0, "image_id": 291, "category_id": 1, "bbox_list": [ [ 1.44, 37.39, 150.01, 249.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man green shirt left.", "normal_caption": "man green shirt left", "solution": [ 1.44, 37.39, 151.01, 250.25 ], "normalized_solution": [ 3, 58, 353, 391 ] }, { "height": 640, "width": 427, "id": 292, "original_id": 535554, "dataset_name": "refcoco", "area": 16076.0192, "iscrowd": 0, "image_id": 292, "category_id": 1, "bbox_list": [ [ 1.44, 37.39, 150.01, 249.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: dude back green shirt.", "normal_caption": "dude back green shirt", "solution": [ 1.44, 37.39, 151.01, 250.25 ], "normalized_solution": [ 3, 58, 353, 391 ] }, { "height": 640, "width": 427, "id": 293, "original_id": 535554, "dataset_name": "refcoco", "area": 16076.0192, "iscrowd": 0, "image_id": 293, "category_id": 1, "bbox_list": [ [ 1.44, 37.39, 150.01, 249.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: green shirt guy back.", "normal_caption": "green shirt guy back", "solution": [ 1.44, 37.39, 151.01, 250.25 ], "normalized_solution": [ 3, 58, 353, 391 ] }, { "height": 640, "width": 427, "id": 294, "original_id": 519195, "dataset_name": "refcoco", "area": 10958.803450000003, "iscrowd": 0, "image_id": 294, "category_id": 1, "bbox_list": [ [ 299.71, 0.0, 426.0, 234.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the man in background right white hat.", "normal_caption": "the man in background right white hat", "solution": [ 299.71, 0.0, 427.0, 235.92 ], "normalized_solution": [ 701, 0, 1000, 368 ] }, { "height": 640, "width": 427, "id": 295, "original_id": 519195, "dataset_name": "refcoco", "area": 10958.803450000003, "iscrowd": 0, "image_id": 295, "category_id": 1, "bbox_list": [ [ 299.71, 0.0, 426.0, 234.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: spectator on right in ball cap.", "normal_caption": "spectator on right in ball cap", "solution": [ 299.71, 0.0, 427.0, 235.92 ], "normalized_solution": [ 701, 0, 1000, 368 ] }, { "height": 640, "width": 427, "id": 296, "original_id": 519195, "dataset_name": "refcoco", "area": 10958.803450000003, "iscrowd": 0, "image_id": 296, "category_id": 1, "bbox_list": [ [ 299.71, 0.0, 426.0, 234.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy back right.", "normal_caption": "guy back right", "solution": [ 299.71, 0.0, 427.0, 235.92 ], "normalized_solution": [ 701, 0, 1000, 368 ] }, { "height": 640, "width": 427, "id": 297, "original_id": 432877, "dataset_name": "refcoco", "area": 97800.53529999999, "iscrowd": 0, "image_id": 297, "category_id": 1, "bbox_list": [ [ 60.54, 44.68, 317.56, 631.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player.", "normal_caption": "player", "solution": [ 60.54, 44.68, 318.56, 632.79 ], "normalized_solution": [ 141, 69, 746, 988 ] }, { "height": 640, "width": 427, "id": 298, "original_id": 432877, "dataset_name": "refcoco", "area": 97800.53529999999, "iscrowd": 0, "image_id": 298, "category_id": 1, "bbox_list": [ [ 60.54, 44.68, 317.56, 631.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580609.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 60.54, 44.68, 318.56, 632.79 ], "normalized_solution": [ 141, 69, 746, 988 ] }, { "height": 480, "width": 640, "id": 299, "original_id": 1573052, "dataset_name": "refcoco", "area": 11358.65435, "iscrowd": 0, "image_id": 299, "category_id": 60, "bbox_list": [ [ 260.58, 4.8, 421.67999999999995, 119.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chocolate sprinkle donut.", "normal_caption": "chocolate sprinkle donut", "solution": [ 260.58, 4.8, 422.68, 120.21 ], "normalized_solution": [ 407, 10, 660, 250 ] }, { "height": 480, "width": 640, "id": 300, "original_id": 1573052, "dataset_name": "refcoco", "area": 11358.65435, "iscrowd": 0, "image_id": 300, "category_id": 60, "bbox_list": [ [ 260.58, 4.8, 421.67999999999995, 119.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brown donut at the top.", "normal_caption": "brown donut at the top", "solution": [ 260.58, 4.8, 422.68, 120.21 ], "normalized_solution": [ 407, 10, 660, 250 ] }, { "height": 480, "width": 640, "id": 301, "original_id": 1573052, "dataset_name": "refcoco", "area": 11358.65435, "iscrowd": 0, "image_id": 301, "category_id": 60, "bbox_list": [ [ 260.58, 4.8, 421.67999999999995, 119.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right dornut.", "normal_caption": "far right dornut", "solution": [ 260.58, 4.8, 422.68, 120.21 ], "normalized_solution": [ 407, 10, 660, 250 ] }, { "height": 480, "width": 640, "id": 302, "original_id": 1572903, "dataset_name": "refcoco", "area": 18103.430149999993, "iscrowd": 0, "image_id": 302, "category_id": 60, "bbox_list": [ [ 357.28, 66.4, 558.52, 201.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right white donut.", "normal_caption": "right white donut", "solution": [ 357.28, 66.4, 559.52, 202.16 ], "normalized_solution": [ 558, 138, 874, 421 ] }, { "height": 480, "width": 640, "id": 303, "original_id": 1572903, "dataset_name": "refcoco", "area": 18103.430149999993, "iscrowd": 0, "image_id": 303, "category_id": 60, "bbox_list": [ [ 357.28, 66.4, 558.52, 201.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: to the top right of sprinkled white doughnut.", "normal_caption": "to the top right of sprinkled white doughnut", "solution": [ 357.28, 66.4, 559.52, 202.16 ], "normalized_solution": [ 558, 138, 874, 421 ] }, { "height": 480, "width": 640, "id": 304, "original_id": 1572903, "dataset_name": "refcoco", "area": 18103.430149999993, "iscrowd": 0, "image_id": 304, "category_id": 60, "bbox_list": [ [ 357.28, 66.4, 558.52, 201.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white frosted no sprinles on right.", "normal_caption": "white frosted no sprinles on right", "solution": [ 357.28, 66.4, 559.52, 202.16 ], "normalized_solution": [ 558, 138, 874, 421 ] }, { "height": 480, "width": 640, "id": 305, "original_id": 1082752, "dataset_name": "refcoco", "area": 13328.303799999998, "iscrowd": 0, "image_id": 305, "category_id": 60, "bbox_list": [ [ 98.02, 3.96, 262.89, 119.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: donut on top left white.", "normal_caption": "donut on top left white", "solution": [ 98.02, 3.96, 263.89, 120.41 ], "normalized_solution": [ 153, 8, 412, 250 ] }, { "height": 480, "width": 640, "id": 306, "original_id": 1082752, "dataset_name": "refcoco", "area": 13328.303799999998, "iscrowd": 0, "image_id": 306, "category_id": 60, "bbox_list": [ [ 98.02, 3.96, 262.89, 119.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left back white donut.", "normal_caption": "left back white donut", "solution": [ 98.02, 3.96, 263.89, 120.41 ], "normalized_solution": [ 153, 8, 412, 250 ] }, { "height": 480, "width": 640, "id": 307, "original_id": 1082752, "dataset_name": "refcoco", "area": 13328.303799999998, "iscrowd": 0, "image_id": 307, "category_id": 60, "bbox_list": [ [ 98.02, 3.96, 262.89, 119.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white one in the back left.", "normal_caption": "white one in the back left", "solution": [ 98.02, 3.96, 263.89, 120.41 ], "normalized_solution": [ 153, 8, 412, 250 ] }, { "height": 480, "width": 640, "id": 308, "original_id": 1082449, "dataset_name": "refcoco", "area": 16707.2383, "iscrowd": 0, "image_id": 308, "category_id": 60, "bbox_list": [ [ 156.44, 75.88, 352.68, 206.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: from top first one in second row chocolate frosted no sprinkles.", "normal_caption": "from top first one in second row chocolate frosted no sprinkles", "solution": [ 156.44, 75.88, 353.68, 207.59 ], "normalized_solution": [ 244, 158, 552, 432 ] }, { "height": 480, "width": 640, "id": 309, "original_id": 1082449, "dataset_name": "refcoco", "area": 16707.2383, "iscrowd": 0, "image_id": 309, "category_id": 60, "bbox_list": [ [ 156.44, 75.88, 352.68, 206.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brown donut center no sprinkles.", "normal_caption": "brown donut center no sprinkles", "solution": [ 156.44, 75.88, 353.68, 207.59 ], "normalized_solution": [ 244, 158, 552, 432 ] }, { "height": 480, "width": 640, "id": 310, "original_id": 1081561, "dataset_name": "refcoco", "area": 40404.35979999999, "iscrowd": 0, "image_id": 310, "category_id": 60, "bbox_list": [ [ 1.08, 170.43, 257.88, 374.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left most donut sprinkles.", "normal_caption": "left most donut sprinkles", "solution": [ 1.08, 170.43, 258.88, 375.37 ], "normalized_solution": [ 1, 355, 404, 782 ] }, { "height": 480, "width": 640, "id": 311, "original_id": 1081561, "dataset_name": "refcoco", "area": 40404.35979999999, "iscrowd": 0, "image_id": 311, "category_id": 60, "bbox_list": [ [ 1.08, 170.43, 257.88, 374.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sprinkles on left.", "normal_caption": "sprinkles on left", "solution": [ 1.08, 170.43, 258.88, 375.37 ], "normalized_solution": [ 1, 355, 404, 782 ] }, { "height": 480, "width": 640, "id": 312, "original_id": 1081561, "dataset_name": "refcoco", "area": 40404.35979999999, "iscrowd": 0, "image_id": 312, "category_id": 60, "bbox_list": [ [ 1.08, 170.43, 257.88, 374.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: leftmost sprinkled.", "normal_caption": "leftmost sprinkled", "solution": [ 1.08, 170.43, 258.88, 375.37 ], "normalized_solution": [ 1, 355, 404, 782 ] }, { "height": 480, "width": 640, "id": 313, "original_id": 1080785, "dataset_name": "refcoco", "area": 36505.92820000001, "iscrowd": 0, "image_id": 313, "category_id": 60, "bbox_list": [ [ 248.84, 143.15, 499.90999999999997, 333.86 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right sprinkle donut white frosting.", "normal_caption": "right sprinkle donut white frosting", "solution": [ 248.84, 143.15, 500.91, 334.86 ], "normalized_solution": [ 388, 298, 782, 697 ] }, { "height": 480, "width": 640, "id": 314, "original_id": 1080785, "dataset_name": "refcoco", "area": 36505.92820000001, "iscrowd": 0, "image_id": 314, "category_id": 60, "bbox_list": [ [ 248.84, 143.15, 499.90999999999997, 333.86 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right donut sprinkles white icing.", "normal_caption": "right donut sprinkles white icing", "solution": [ 248.84, 143.15, 500.91, 334.86 ], "normalized_solution": [ 388, 298, 782, 697 ] }, { "height": 480, "width": 640, "id": 315, "original_id": 1080785, "dataset_name": "refcoco", "area": 36505.92820000001, "iscrowd": 0, "image_id": 315, "category_id": 60, "bbox_list": [ [ 248.84, 143.15, 499.90999999999997, 333.86 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: donut with sprinkles on right.", "normal_caption": "donut with sprinkles on right", "solution": [ 248.84, 143.15, 500.91, 334.86 ], "normalized_solution": [ 388, 298, 782, 697 ] }, { "height": 480, "width": 640, "id": 316, "original_id": 1078574, "dataset_name": "refcoco", "area": 47408.689000000006, "iscrowd": 0, "image_id": 316, "category_id": 60, "bbox_list": [ [ 107.87, 308.49, 447.72, 477.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom donut.", "normal_caption": "bottom donut", "solution": [ 107.87, 308.49, 448.72, 478.92 ], "normalized_solution": [ 168, 642, 701, 997 ] }, { "height": 480, "width": 640, "id": 317, "original_id": 1078574, "dataset_name": "refcoco", "area": 47408.689000000006, "iscrowd": 0, "image_id": 317, "category_id": 60, "bbox_list": [ [ 107.87, 308.49, 447.72, 477.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front donut.", "normal_caption": "front donut", "solution": [ 107.87, 308.49, 448.72, 478.92 ], "normalized_solution": [ 168, 642, 701, 997 ] }, { "height": 480, "width": 640, "id": 318, "original_id": 1078574, "dataset_name": "refcoco", "area": 47408.689000000006, "iscrowd": 0, "image_id": 318, "category_id": 60, "bbox_list": [ [ 107.87, 308.49, 447.72, 477.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580600.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front donut.", "normal_caption": "front donut", "solution": [ 107.87, 308.49, 448.72, 478.92 ], "normalized_solution": [ 168, 642, 701, 997 ] }, { "height": 480, "width": 640, "id": 319, "original_id": 1081274, "dataset_name": "refcoco", "area": 47012.904800000004, "iscrowd": 0, "image_id": 319, "category_id": 60, "bbox_list": [ [ 0.0, 146.36, 604.74, 352.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580579.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: all doughnut on the outside.", "normal_caption": "all doughnut on the outside", "solution": [ 0.0, 146.36, 605.74, 353.93 ], "normalized_solution": [ 0, 304, 946, 737 ] }, { "height": 480, "width": 640, "id": 320, "original_id": 1081274, "dataset_name": "refcoco", "area": 47012.904800000004, "iscrowd": 0, "image_id": 320, "category_id": 60, "bbox_list": [ [ 0.0, 146.36, 604.74, 352.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580579.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: powder donuts.", "normal_caption": "powder donuts", "solution": [ 0.0, 146.36, 605.74, 353.93 ], "normalized_solution": [ 0, 304, 946, 737 ] }, { "height": 480, "width": 640, "id": 321, "original_id": 1081274, "dataset_name": "refcoco", "area": 47012.904800000004, "iscrowd": 0, "image_id": 321, "category_id": 60, "bbox_list": [ [ 0.0, 146.36, 604.74, 352.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580579.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white donut on right.", "normal_caption": "white donut on right", "solution": [ 0.0, 146.36, 605.74, 353.93 ], "normalized_solution": [ 0, 304, 946, 737 ] }, { "height": 480, "width": 640, "id": 322, "original_id": 1078418, "dataset_name": "refcoco", "area": 11597.144450000002, "iscrowd": 0, "image_id": 322, "category_id": 60, "bbox_list": [ [ 245.93, 187.69, 393.79, 297.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580579.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: donut center of box with creamy frosting and nuts.", "normal_caption": "donut center of box with creamy frosting and nuts", "solution": [ 245.93, 187.69, 394.79, 298.79 ], "normalized_solution": [ 384, 391, 616, 622 ] }, { "height": 480, "width": 640, "id": 323, "original_id": 1078418, "dataset_name": "refcoco", "area": 11597.144450000002, "iscrowd": 0, "image_id": 323, "category_id": 60, "bbox_list": [ [ 245.93, 187.69, 393.79, 297.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580579.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white donut toward middle.", "normal_caption": "white donut toward middle", "solution": [ 245.93, 187.69, 394.79, 298.79 ], "normalized_solution": [ 384, 391, 616, 622 ] }, { "height": 480, "width": 640, "id": 324, "original_id": 1078418, "dataset_name": "refcoco", "area": 11597.144450000002, "iscrowd": 0, "image_id": 324, "category_id": 60, "bbox_list": [ [ 245.93, 187.69, 393.79, 297.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580579.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: center donut with nuts on top.", "normal_caption": "center donut with nuts on top", "solution": [ 245.93, 187.69, 394.79, 298.79 ], "normalized_solution": [ 384, 391, 616, 622 ] }, { "height": 480, "width": 640, "id": 325, "original_id": 400876, "dataset_name": "refcoco", "area": 17503.45175, "iscrowd": 0, "image_id": 325, "category_id": 8, "bbox_list": [ [ 0.0, 205.61, 186.66, 371.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580562.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: gray dump truck.", "normal_caption": "gray dump truck", "solution": [ 0.0, 205.61, 187.66, 372.41 ], "normalized_solution": [ 0, 428, 293, 775 ] }, { "height": 480, "width": 640, "id": 326, "original_id": 400876, "dataset_name": "refcoco", "area": 17503.45175, "iscrowd": 0, "image_id": 326, "category_id": 8, "bbox_list": [ [ 0.0, 205.61, 186.66, 371.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580562.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left partial gray truck.", "normal_caption": "left partial gray truck", "solution": [ 0.0, 205.61, 187.66, 372.41 ], "normalized_solution": [ 0, 428, 293, 775 ] }, { "height": 480, "width": 640, "id": 327, "original_id": 400876, "dataset_name": "refcoco", "area": 17503.45175, "iscrowd": 0, "image_id": 327, "category_id": 8, "bbox_list": [ [ 0.0, 205.61, 186.66, 371.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580562.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: gray cargo.", "normal_caption": "gray cargo", "solution": [ 0.0, 205.61, 187.66, 372.41 ], "normalized_solution": [ 0, 428, 293, 775 ] }, { "height": 480, "width": 640, "id": 328, "original_id": 396728, "dataset_name": "refcoco", "area": 87202.26919999998, "iscrowd": 0, "image_id": 328, "category_id": 8, "bbox_list": [ [ 85.6, 137.88, 589.52, 381.75 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580562.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red truck.", "normal_caption": "red truck", "solution": [ 85.6, 137.88, 590.52, 382.75 ], "normalized_solution": [ 133, 287, 922, 797 ] }, { "height": 480, "width": 640, "id": 329, "original_id": 396728, "dataset_name": "refcoco", "area": 87202.26919999998, "iscrowd": 0, "image_id": 329, "category_id": 8, "bbox_list": [ [ 85.6, 137.88, 589.52, 381.75 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580562.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: truck.", "normal_caption": "truck", "solution": [ 85.6, 137.88, 590.52, 382.75 ], "normalized_solution": [ 133, 287, 922, 797 ] }, { "height": 480, "width": 640, "id": 330, "original_id": 396728, "dataset_name": "refcoco", "area": 87202.26919999998, "iscrowd": 0, "image_id": 330, "category_id": 8, "bbox_list": [ [ 85.6, 137.88, 589.52, 381.75 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580562.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: truck.", "normal_caption": "truck", "solution": [ 85.6, 137.88, 590.52, 382.75 ], "normalized_solution": [ 133, 287, 922, 797 ] }, { "height": 480, "width": 640, "id": 331, "original_id": 167760, "dataset_name": "refcoco", "area": 15910.16625, "iscrowd": 0, "image_id": 331, "category_id": 6, "bbox_list": [ [ 24.86, 200.54, 154.68, 335.76 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580549.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left bus.", "normal_caption": "left bus", "solution": [ 24.86, 200.54, 155.68, 336.76 ], "normalized_solution": [ 38, 417, 243, 701 ] }, { "height": 480, "width": 640, "id": 332, "original_id": 167760, "dataset_name": "refcoco", "area": 15910.16625, "iscrowd": 0, "image_id": 332, "category_id": 6, "bbox_list": [ [ 24.86, 200.54, 154.68, 335.76 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580549.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bus on left.", "normal_caption": "bus on left", "solution": [ 24.86, 200.54, 155.68, 336.76 ], "normalized_solution": [ 38, 417, 243, 701 ] }, { "height": 480, "width": 640, "id": 333, "original_id": 167760, "dataset_name": "refcoco", "area": 15910.16625, "iscrowd": 0, "image_id": 333, "category_id": 6, "bbox_list": [ [ 24.86, 200.54, 154.68, 335.76 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580549.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far left bus.", "normal_caption": "far left bus", "solution": [ 24.86, 200.54, 155.68, 336.76 ], "normalized_solution": [ 38, 417, 243, 701 ] }, { "height": 480, "width": 640, "id": 334, "original_id": 166290, "dataset_name": "refcoco", "area": 62307.72130000001, "iscrowd": 0, "image_id": 334, "category_id": 6, "bbox_list": [ [ 152.09, 189.84, 607.36, 353.88 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580549.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bus in front.", "normal_caption": "bus in front", "solution": [ 152.09, 189.84, 608.36, 354.88 ], "normalized_solution": [ 237, 395, 950, 739 ] }, { "height": 480, "width": 640, "id": 335, "original_id": 166290, "dataset_name": "refcoco", "area": 62307.72130000001, "iscrowd": 0, "image_id": 335, "category_id": 6, "bbox_list": [ [ 152.09, 189.84, 607.36, 353.88 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580549.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bus in front.", "normal_caption": "bus in front", "solution": [ 152.09, 189.84, 608.36, 354.88 ], "normalized_solution": [ 237, 395, 950, 739 ] }, { "height": 480, "width": 640, "id": 336, "original_id": 166290, "dataset_name": "refcoco", "area": 62307.72130000001, "iscrowd": 0, "image_id": 336, "category_id": 6, "bbox_list": [ [ 152.09, 189.84, 607.36, 353.88 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580549.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front bus.", "normal_caption": "front bus", "solution": [ 152.09, 189.84, 608.36, 354.88 ], "normalized_solution": [ 237, 395, 950, 739 ] }, { "height": 640, "width": 480, "id": 337, "original_id": 704443, "dataset_name": "refcoco", "area": 12148.273350000003, "iscrowd": 0, "image_id": 337, "category_id": 50, "bbox_list": [ [ 0.0, 191.7, 204.94, 287.54999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580541.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top spoon on plate.", "normal_caption": "top spoon on plate", "solution": [ 0.0, 191.7, 205.94, 288.55 ], "normalized_solution": [ 0, 299, 429, 450 ] }, { "height": 640, "width": 480, "id": 338, "original_id": 704443, "dataset_name": "refcoco", "area": 12148.273350000003, "iscrowd": 0, "image_id": 338, "category_id": 50, "bbox_list": [ [ 0.0, 191.7, 204.94, 287.54999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580541.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top spoon on plate.", "normal_caption": "top spoon on plate", "solution": [ 0.0, 191.7, 205.94, 288.55 ], "normalized_solution": [ 0, 299, 429, 450 ] }, { "height": 640, "width": 480, "id": 339, "original_id": 704443, "dataset_name": "refcoco", "area": 12148.273350000003, "iscrowd": 0, "image_id": 339, "category_id": 50, "bbox_list": [ [ 0.0, 191.7, 204.94, 287.54999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580541.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: spoon on the left.", "normal_caption": "spoon on the left", "solution": [ 0.0, 191.7, 205.94, 288.55 ], "normalized_solution": [ 0, 299, 429, 450 ] }, { "height": 640, "width": 480, "id": 340, "original_id": 704091, "dataset_name": "refcoco", "area": 18689.2502, "iscrowd": 0, "image_id": 340, "category_id": 50, "bbox_list": [ [ 0.0, 376.73, 400.3, 638.58 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580541.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom spoon.", "normal_caption": "bottom spoon", "solution": [ 0.0, 376.73, 401.3, 639.58 ], "normalized_solution": [ 0, 588, 836, 999 ] }, { "height": 640, "width": 480, "id": 341, "original_id": 704091, "dataset_name": "refcoco", "area": 18689.2502, "iscrowd": 0, "image_id": 341, "category_id": 50, "bbox_list": [ [ 0.0, 376.73, 400.3, 638.58 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580541.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: spoon.", "normal_caption": "spoon", "solution": [ 0.0, 376.73, 401.3, 639.58 ], "normalized_solution": [ 0, 588, 836, 999 ] }, { "height": 640, "width": 480, "id": 342, "original_id": 704091, "dataset_name": "refcoco", "area": 18689.2502, "iscrowd": 0, "image_id": 342, "category_id": 50, "bbox_list": [ [ 0.0, 376.73, 400.3, 638.58 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580541.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom spoon.", "normal_caption": "bottom spoon", "solution": [ 0.0, 376.73, 401.3, 639.58 ], "normalized_solution": [ 0, 588, 836, 999 ] }, { "height": 425, "width": 640, "id": 343, "original_id": 468744, "dataset_name": "refcoco", "area": 56598.93265, "iscrowd": 0, "image_id": 343, "category_id": 1, "bbox_list": [ [ 404.94, 93.66, 639.0, 407.83000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady.", "normal_caption": "lady", "solution": [ 404.94, 93.66, 640.0, 408.83 ], "normalized_solution": [ 632, 220, 1000, 961 ] }, { "height": 425, "width": 640, "id": 344, "original_id": 468744, "dataset_name": "refcoco", "area": 56598.93265, "iscrowd": 0, "image_id": 344, "category_id": 1, "bbox_list": [ [ 404.94, 93.66, 639.0, 407.83000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the woman.", "normal_caption": "the woman", "solution": [ 404.94, 93.66, 640.0, 408.83 ], "normalized_solution": [ 632, 220, 1000, 961 ] }, { "height": 425, "width": 640, "id": 345, "original_id": 468744, "dataset_name": "refcoco", "area": 56598.93265, "iscrowd": 0, "image_id": 345, "category_id": 1, "bbox_list": [ [ 404.94, 93.66, 639.0, 407.83000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 404.94, 93.66, 640.0, 408.83 ], "normalized_solution": [ 632, 220, 1000, 961 ] }, { "height": 425, "width": 640, "id": 346, "original_id": 428122, "dataset_name": "refcoco", "area": 109232.86249999999, "iscrowd": 0, "image_id": 346, "category_id": 1, "bbox_list": [ [ 0.0, 63.18, 470.9, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man with glasses.", "normal_caption": "man with glasses", "solution": [ 0.0, 63.18, 471.9, 425.0 ], "normalized_solution": [ 0, 148, 737, 1000 ] }, { "height": 425, "width": 640, "id": 347, "original_id": 428122, "dataset_name": "refcoco", "area": 109232.86249999999, "iscrowd": 0, "image_id": 347, "category_id": 1, "bbox_list": [ [ 0.0, 63.18, 470.9, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 0.0, 63.18, 471.9, 425.0 ], "normalized_solution": [ 0, 148, 737, 1000 ] }, { "height": 425, "width": 640, "id": 348, "original_id": 428122, "dataset_name": "refcoco", "area": 109232.86249999999, "iscrowd": 0, "image_id": 348, "category_id": 1, "bbox_list": [ [ 0.0, 63.18, 470.9, 424.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 0.0, 63.18, 471.9, 425.0 ], "normalized_solution": [ 0, 148, 737, 1000 ] }, { "height": 480, "width": 640, "id": 349, "original_id": 595610, "dataset_name": "refcoco", "area": 26805.096750000004, "iscrowd": 0, "image_id": 349, "category_id": 25, "bbox_list": [ [ 398.02, 39.97, 627.47, 428.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580510.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girrffe on right.", "normal_caption": "girrffe on right", "solution": [ 398.02, 39.97, 628.47, 429.27 ], "normalized_solution": [ 621, 83, 981, 894 ] }, { "height": 480, "width": 640, "id": 350, "original_id": 595610, "dataset_name": "refcoco", "area": 26805.096750000004, "iscrowd": 0, "image_id": 350, "category_id": 25, "bbox_list": [ [ 398.02, 39.97, 627.47, 428.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580510.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: big giraffe on right.", "normal_caption": "big giraffe on right", "solution": [ 398.02, 39.97, 628.47, 429.27 ], "normalized_solution": [ 621, 83, 981, 894 ] }, { "height": 480, "width": 640, "id": 351, "original_id": 595610, "dataset_name": "refcoco", "area": 26805.096750000004, "iscrowd": 0, "image_id": 351, "category_id": 25, "bbox_list": [ [ 398.02, 39.97, 627.47, 428.27 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580510.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right giraf.", "normal_caption": "right giraf", "solution": [ 398.02, 39.97, 628.47, 429.27 ], "normalized_solution": [ 621, 83, 981, 894 ] }, { "height": 480, "width": 640, "id": 352, "original_id": 594546, "dataset_name": "refcoco", "area": 26448.83585, "iscrowd": 0, "image_id": 352, "category_id": 25, "bbox_list": [ [ 213.57, 97.35, 474.69, 431.80999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580510.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left giraffe.", "normal_caption": "left giraffe", "solution": [ 213.57, 97.35, 475.69, 432.81 ], "normalized_solution": [ 333, 202, 743, 901 ] }, { "height": 480, "width": 640, "id": 353, "original_id": 594546, "dataset_name": "refcoco", "area": 26448.83585, "iscrowd": 0, "image_id": 353, "category_id": 25, "bbox_list": [ [ 213.57, 97.35, 474.69, 431.80999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580510.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle giraffe.", "normal_caption": "middle giraffe", "solution": [ 213.57, 97.35, 475.69, 432.81 ], "normalized_solution": [ 333, 202, 743, 901 ] }, { "height": 480, "width": 640, "id": 354, "original_id": 594546, "dataset_name": "refcoco", "area": 26448.83585, "iscrowd": 0, "image_id": 354, "category_id": 25, "bbox_list": [ [ 213.57, 97.35, 474.69, 431.80999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580510.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left giraffe big.", "normal_caption": "left giraffe big", "solution": [ 213.57, 97.35, 475.69, 432.81 ], "normalized_solution": [ 333, 202, 743, 901 ] }, { "height": 469, "width": 640, "id": 355, "original_id": 1283502, "dataset_name": "refcoco", "area": 52858.03964999999, "iscrowd": 0, "image_id": 355, "category_id": 1, "bbox_list": [ [ 4.28, 113.5, 290.25, 468.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 4.28, 113.5, 291.25, 469.0 ], "normalized_solution": [ 6, 242, 455, 1000 ] }, { "height": 469, "width": 640, "id": 356, "original_id": 1283502, "dataset_name": "refcoco", "area": 52858.03964999999, "iscrowd": 0, "image_id": 356, "category_id": 1, "bbox_list": [ [ 4.28, 113.5, 290.25, 468.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on left in black.", "normal_caption": "woman on left in black", "solution": [ 4.28, 113.5, 291.25, 469.0 ], "normalized_solution": [ 6, 242, 455, 1000 ] }, { "height": 469, "width": 640, "id": 357, "original_id": 1251093, "dataset_name": "refcoco", "area": 90780.60010000001, "iscrowd": 0, "image_id": 357, "category_id": 1, "bbox_list": [ [ 204.92, 80.81, 559.9, 463.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in white parka.", "normal_caption": "girl in white parka", "solution": [ 204.92, 80.81, 560.9, 464.25 ], "normalized_solution": [ 320, 172, 876, 989 ] }, { "height": 469, "width": 640, "id": 358, "original_id": 1251093, "dataset_name": "refcoco", "area": 90780.60010000001, "iscrowd": 0, "image_id": 358, "category_id": 1, "bbox_list": [ [ 204.92, 80.81, 559.9, 463.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white coat.", "normal_caption": "white coat", "solution": [ 204.92, 80.81, 560.9, 464.25 ], "normalized_solution": [ 320, 172, 876, 989 ] }, { "height": 469, "width": 640, "id": 359, "original_id": 1251093, "dataset_name": "refcoco", "area": 90780.60010000001, "iscrowd": 0, "image_id": 359, "category_id": 1, "bbox_list": [ [ 204.92, 80.81, 559.9, 463.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in white.", "normal_caption": "woman in white", "solution": [ 204.92, 80.81, 560.9, 464.25 ], "normalized_solution": [ 320, 172, 876, 989 ] }, { "height": 469, "width": 640, "id": 360, "original_id": 1727383, "dataset_name": "refcoco", "area": 32713.919400000002, "iscrowd": 0, "image_id": 360, "category_id": 1, "bbox_list": [ [ 446.87, 50.59, 627.14, 468.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man yellow black scarf.", "normal_caption": "man yellow black scarf", "solution": [ 446.87, 50.59, 628.14, 469.0 ], "normalized_solution": [ 698, 107, 981, 1000 ] }, { "height": 469, "width": 640, "id": 361, "original_id": 1727383, "dataset_name": "refcoco", "area": 32713.919400000002, "iscrowd": 0, "image_id": 361, "category_id": 1, "bbox_list": [ [ 446.87, 50.59, 627.14, 468.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: gray shirt.", "normal_caption": "gray shirt", "solution": [ 446.87, 50.59, 628.14, 469.0 ], "normalized_solution": [ 698, 107, 981, 1000 ] }, { "height": 469, "width": 640, "id": 362, "original_id": 1727383, "dataset_name": "refcoco", "area": 32713.919400000002, "iscrowd": 0, "image_id": 362, "category_id": 1, "bbox_list": [ [ 446.87, 50.59, 627.14, 468.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580505.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right guy.", "normal_caption": "right guy", "solution": [ 446.87, 50.59, 628.14, 469.0 ], "normalized_solution": [ 698, 107, 981, 1000 ] }, { "height": 412, "width": 640, "id": 363, "original_id": 525009, "dataset_name": "refcoco", "area": 25015.630200000007, "iscrowd": 0, "image_id": 363, "category_id": 1, "bbox_list": [ [ 117.71, 47.92, 267.23, 366.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person with blue jacket.", "normal_caption": "person with blue jacket", "solution": [ 117.71, 47.92, 268.23, 367.29 ], "normalized_solution": [ 183, 116, 419, 891 ] }, { "height": 412, "width": 640, "id": 364, "original_id": 525009, "dataset_name": "refcoco", "area": 25015.630200000007, "iscrowd": 0, "image_id": 364, "category_id": 1, "bbox_list": [ [ 117.71, 47.92, 267.23, 366.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: one in blue.", "normal_caption": "one in blue", "solution": [ 117.71, 47.92, 268.23, 367.29 ], "normalized_solution": [ 183, 116, 419, 891 ] }, { "height": 412, "width": 640, "id": 365, "original_id": 525009, "dataset_name": "refcoco", "area": 25015.630200000007, "iscrowd": 0, "image_id": 365, "category_id": 1, "bbox_list": [ [ 117.71, 47.92, 267.23, 366.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on left.", "normal_caption": "person on left", "solution": [ 117.71, 47.92, 268.23, 367.29 ], "normalized_solution": [ 183, 116, 419, 891 ] }, { "height": 412, "width": 640, "id": 366, "original_id": 492842, "dataset_name": "refcoco", "area": 24255.090649999995, "iscrowd": 0, "image_id": 366, "category_id": 1, "bbox_list": [ [ 377.67, 32.01, 525.14, 350.21999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right women.", "normal_caption": "right women", "solution": [ 377.67, 32.01, 526.14, 351.22 ], "normalized_solution": [ 590, 77, 822, 852 ] }, { "height": 412, "width": 640, "id": 367, "original_id": 492842, "dataset_name": "refcoco", "area": 24255.090649999995, "iscrowd": 0, "image_id": 367, "category_id": 1, "bbox_list": [ [ 377.67, 32.01, 525.14, 350.21999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right.", "normal_caption": "woman on right", "solution": [ 377.67, 32.01, 526.14, 351.22 ], "normalized_solution": [ 590, 77, 822, 852 ] }, { "height": 412, "width": 640, "id": 368, "original_id": 492842, "dataset_name": "refcoco", "area": 24255.090649999995, "iscrowd": 0, "image_id": 368, "category_id": 1, "bbox_list": [ [ 377.67, 32.01, 525.14, 350.21999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady on right.", "normal_caption": "lady on right", "solution": [ 377.67, 32.01, 526.14, 351.22 ], "normalized_solution": [ 590, 77, 822, 852 ] }, { "height": 412, "width": 640, "id": 369, "original_id": 437779, "dataset_name": "refcoco", "area": 11179.62435, "iscrowd": 0, "image_id": 369, "category_id": 1, "bbox_list": [ [ 303.7, 152.02, 395.03999999999996, 360.90999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid.", "normal_caption": "kid", "solution": [ 303.7, 152.02, 396.04, 361.91 ], "normalized_solution": [ 474, 368, 618, 878 ] }, { "height": 412, "width": 640, "id": 370, "original_id": 437779, "dataset_name": "refcoco", "area": 11179.62435, "iscrowd": 0, "image_id": 370, "category_id": 1, "bbox_list": [ [ 303.7, 152.02, 395.03999999999996, 360.90999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: child.", "normal_caption": "child", "solution": [ 303.7, 152.02, 396.04, 361.91 ], "normalized_solution": [ 474, 368, 618, 878 ] }, { "height": 412, "width": 640, "id": 371, "original_id": 437779, "dataset_name": "refcoco", "area": 11179.62435, "iscrowd": 0, "image_id": 371, "category_id": 1, "bbox_list": [ [ 303.7, 152.02, 395.03999999999996, 360.90999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580434.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink suit.", "normal_caption": "pink suit", "solution": [ 303.7, 152.02, 396.04, 361.91 ], "normalized_solution": [ 474, 368, 618, 878 ] }, { "height": 640, "width": 512, "id": 372, "original_id": 505324, "dataset_name": "refcoco", "area": 61154.41240000001, "iscrowd": 0, "image_id": 372, "category_id": 1, "bbox_list": [ [ 50.34, 76.22, 289.52, 630.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580408.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman with glasses.", "normal_caption": "woman with glasses", "solution": [ 50.34, 76.22, 290.52, 631.37 ], "normalized_solution": [ 98, 119, 567, 986 ] }, { "height": 640, "width": 512, "id": 373, "original_id": 505324, "dataset_name": "refcoco", "area": 61154.41240000001, "iscrowd": 0, "image_id": 373, "category_id": 1, "bbox_list": [ [ 50.34, 76.22, 289.52, 630.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580408.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person holding blow drier.", "normal_caption": "person holding blow drier", "solution": [ 50.34, 76.22, 290.52, 631.37 ], "normalized_solution": [ 98, 119, 567, 986 ] }, { "height": 640, "width": 512, "id": 374, "original_id": 505324, "dataset_name": "refcoco", "area": 61154.41240000001, "iscrowd": 0, "image_id": 374, "category_id": 1, "bbox_list": [ [ 50.34, 76.22, 289.52, 630.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580408.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: back lady.", "normal_caption": "back lady", "solution": [ 50.34, 76.22, 290.52, 631.37 ], "normalized_solution": [ 98, 119, 567, 986 ] }, { "height": 640, "width": 512, "id": 375, "original_id": 443664, "dataset_name": "refcoco", "area": 105929.45969999999, "iscrowd": 0, "image_id": 375, "category_id": 1, "bbox_list": [ [ 143.82, 156.76, 502.37, 631.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580408.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front woman.", "normal_caption": "front woman", "solution": [ 143.82, 156.76, 503.37, 632.81 ], "normalized_solution": [ 280, 244, 983, 988 ] }, { "height": 640, "width": 512, "id": 376, "original_id": 443664, "dataset_name": "refcoco", "area": 105929.45969999999, "iscrowd": 0, "image_id": 376, "category_id": 1, "bbox_list": [ [ 143.82, 156.76, 502.37, 631.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580408.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front gitl.", "normal_caption": "front gitl", "solution": [ 143.82, 156.76, 503.37, 632.81 ], "normalized_solution": [ 280, 244, 983, 988 ] }, { "height": 640, "width": 512, "id": 377, "original_id": 443664, "dataset_name": "refcoco", "area": 105929.45969999999, "iscrowd": 0, "image_id": 377, "category_id": 1, "bbox_list": [ [ 143.82, 156.76, 502.37, 631.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580408.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in front.", "normal_caption": "girl in front", "solution": [ 143.82, 156.76, 503.37, 632.81 ], "normalized_solution": [ 280, 244, 983, 988 ] }, { "height": 472, "width": 640, "id": 378, "original_id": 1709147, "dataset_name": "refcoco", "area": 25271.057950000006, "iscrowd": 0, "image_id": 378, "category_id": 1, "bbox_list": [ [ 432.84, 59.37, 598.0, 311.3 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: women sitting on right.", "normal_caption": "women sitting on right", "solution": [ 432.84, 59.37, 599.0, 312.3 ], "normalized_solution": [ 676, 125, 935, 661 ] }, { "height": 472, "width": 640, "id": 379, "original_id": 1709147, "dataset_name": "refcoco", "area": 25271.057950000006, "iscrowd": 0, "image_id": 379, "category_id": 1, "bbox_list": [ [ 432.84, 59.37, 598.0, 311.3 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman behind racket.", "normal_caption": "woman behind racket", "solution": [ 432.84, 59.37, 599.0, 312.3 ], "normalized_solution": [ 676, 125, 935, 661 ] }, { "height": 472, "width": 640, "id": 380, "original_id": 1709147, "dataset_name": "refcoco", "area": 25271.057950000006, "iscrowd": 0, "image_id": 380, "category_id": 1, "bbox_list": [ [ 432.84, 59.37, 598.0, 311.3 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady sitting down but not in stands.", "normal_caption": "lady sitting down but not in stands", "solution": [ 432.84, 59.37, 599.0, 312.3 ], "normalized_solution": [ 676, 125, 935, 661 ] }, { "height": 472, "width": 640, "id": 381, "original_id": 464873, "dataset_name": "refcoco", "area": 13001.2688, "iscrowd": 0, "image_id": 381, "category_id": 1, "bbox_list": [ [ 80.25, 0.0, 220.74, 126.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue spectator.", "normal_caption": "blue spectator", "solution": [ 80.25, 0.0, 221.74, 127.87 ], "normalized_solution": [ 125, 0, 346, 270 ] }, { "height": 472, "width": 640, "id": 382, "original_id": 464873, "dataset_name": "refcoco", "area": 13001.2688, "iscrowd": 0, "image_id": 382, "category_id": 1, "bbox_list": [ [ 80.25, 0.0, 220.74, 126.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue shirt top left.", "normal_caption": "blue shirt top left", "solution": [ 80.25, 0.0, 221.74, 127.87 ], "normalized_solution": [ 125, 0, 346, 270 ] }, { "height": 472, "width": 640, "id": 383, "original_id": 464873, "dataset_name": "refcoco", "area": 13001.2688, "iscrowd": 0, "image_id": 383, "category_id": 1, "bbox_list": [ [ 80.25, 0.0, 220.74, 126.87 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue shirt guy standing on the left.", "normal_caption": "blue shirt guy standing on the left", "solution": [ 80.25, 0.0, 221.74, 127.87 ], "normalized_solution": [ 125, 0, 346, 270 ] }, { "height": 472, "width": 640, "id": 384, "original_id": 452819, "dataset_name": "refcoco", "area": 59154.707350000004, "iscrowd": 0, "image_id": 384, "category_id": 1, "bbox_list": [ [ 228.08, 12.58, 474.17, 467.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front and center girl.", "normal_caption": "front and center girl", "solution": [ 228.08, 12.58, 475.17, 468.74 ], "normalized_solution": [ 356, 26, 742, 993 ] }, { "height": 472, "width": 640, "id": 385, "original_id": 452819, "dataset_name": "refcoco", "area": 59154.707350000004, "iscrowd": 0, "image_id": 385, "category_id": 1, "bbox_list": [ [ 228.08, 12.58, 474.17, 467.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player.", "normal_caption": "player", "solution": [ 228.08, 12.58, 475.17, 468.74 ], "normalized_solution": [ 356, 26, 742, 993 ] }, { "height": 472, "width": 640, "id": 386, "original_id": 452819, "dataset_name": "refcoco", "area": 59154.707350000004, "iscrowd": 0, "image_id": 386, "category_id": 1, "bbox_list": [ [ 228.08, 12.58, 474.17, 467.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580396.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chick with the racket.", "normal_caption": "chick with the racket", "solution": [ 228.08, 12.58, 475.17, 468.74 ], "normalized_solution": [ 356, 26, 742, 993 ] }, { "height": 424, "width": 640, "id": 387, "original_id": 1706014, "dataset_name": "refcoco", "area": 14429.973649999998, "iscrowd": 0, "image_id": 387, "category_id": 1, "bbox_list": [ [ 492.76, 1.43, 639.0, 140.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand in top right corner.", "normal_caption": "hand in top right corner", "solution": [ 492.76, 1.43, 640.0, 141.81 ], "normalized_solution": [ 769, 3, 1000, 334 ] }, { "height": 424, "width": 640, "id": 388, "original_id": 1706014, "dataset_name": "refcoco", "area": 14429.973649999998, "iscrowd": 0, "image_id": 388, "category_id": 1, "bbox_list": [ [ 492.76, 1.43, 639.0, 140.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand far right.", "normal_caption": "hand far right", "solution": [ 492.76, 1.43, 640.0, 141.81 ], "normalized_solution": [ 769, 3, 1000, 334 ] }, { "height": 424, "width": 640, "id": 389, "original_id": 683291, "dataset_name": "refcoco", "area": 15699.134349999998, "iscrowd": 0, "image_id": 389, "category_id": 47, "bbox_list": [ [ 99.07, 16.93, 199.18, 215.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: beer on left.", "normal_caption": "beer on left", "solution": [ 99.07, 16.93, 200.18, 216.41 ], "normalized_solution": [ 154, 39, 312, 510 ] }, { "height": 424, "width": 640, "id": 390, "original_id": 683291, "dataset_name": "refcoco", "area": 15699.134349999998, "iscrowd": 0, "image_id": 390, "category_id": 47, "bbox_list": [ [ 99.07, 16.93, 199.18, 215.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left most glass.", "normal_caption": "left most glass", "solution": [ 99.07, 16.93, 200.18, 216.41 ], "normalized_solution": [ 154, 39, 312, 510 ] }, { "height": 424, "width": 640, "id": 391, "original_id": 683291, "dataset_name": "refcoco", "area": 15699.134349999998, "iscrowd": 0, "image_id": 391, "category_id": 47, "bbox_list": [ [ 99.07, 16.93, 199.18, 215.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: half empty glass left.", "normal_caption": "half empty glass left", "solution": [ 99.07, 16.93, 200.18, 216.41 ], "normalized_solution": [ 154, 39, 312, 510 ] }, { "height": 424, "width": 640, "id": 392, "original_id": 682871, "dataset_name": "refcoco", "area": 16409.60945, "iscrowd": 0, "image_id": 392, "category_id": 47, "bbox_list": [ [ 389.78, 43.35, 494.29999999999995, 228.68 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: glass of beer in middle behind burger.", "normal_caption": "glass of beer in middle behind burger", "solution": [ 389.78, 43.35, 495.3, 229.68 ], "normalized_solution": [ 609, 102, 773, 541 ] }, { "height": 424, "width": 640, "id": 393, "original_id": 682871, "dataset_name": "refcoco", "area": 16409.60945, "iscrowd": 0, "image_id": 393, "category_id": 47, "bbox_list": [ [ 389.78, 43.35, 494.29999999999995, 228.68 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: glass on right.", "normal_caption": "glass on right", "solution": [ 389.78, 43.35, 495.3, 229.68 ], "normalized_solution": [ 609, 102, 773, 541 ] }, { "height": 424, "width": 640, "id": 394, "original_id": 682871, "dataset_name": "refcoco", "area": 16409.60945, "iscrowd": 0, "image_id": 394, "category_id": 47, "bbox_list": [ [ 389.78, 43.35, 494.29999999999995, 228.68 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: glass behind burger.", "normal_caption": "glass behind burger", "solution": [ 389.78, 43.35, 495.3, 229.68 ], "normalized_solution": [ 609, 102, 773, 541 ] }, { "height": 424, "width": 640, "id": 395, "original_id": 438134, "dataset_name": "refcoco", "area": 53645.597299999994, "iscrowd": 0, "image_id": 395, "category_id": 1, "bbox_list": [ [ 1.91, 2.86, 425.86, 180.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the person on the left.", "normal_caption": "the person on the left", "solution": [ 1.91, 2.86, 426.86, 181.03 ], "normalized_solution": [ 2, 6, 666, 426 ] }, { "height": 424, "width": 640, "id": 396, "original_id": 438134, "dataset_name": "refcoco", "area": 53645.597299999994, "iscrowd": 0, "image_id": 396, "category_id": 1, "bbox_list": [ [ 1.91, 2.86, 425.86, 180.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580344.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hands on left top.", "normal_caption": "hands on left top", "solution": [ 1.91, 2.86, 426.86, 181.03 ], "normalized_solution": [ 2, 6, 666, 426 ] }, { "height": 502, "width": 640, "id": 397, "original_id": 587559, "dataset_name": "refcoco", "area": 51960.03205000002, "iscrowd": 0, "image_id": 397, "category_id": 23, "bbox_list": [ [ 287.5, 94.44, 518.97, 446.08 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580296.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bear on the right.", "normal_caption": "bear on the right", "solution": [ 287.5, 94.44, 519.97, 447.08 ], "normalized_solution": [ 449, 188, 812, 890 ] }, { "height": 502, "width": 640, "id": 398, "original_id": 587559, "dataset_name": "refcoco", "area": 51960.03205000002, "iscrowd": 0, "image_id": 398, "category_id": 23, "bbox_list": [ [ 287.5, 94.44, 518.97, 446.08 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580296.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right bear.", "normal_caption": "right bear", "solution": [ 287.5, 94.44, 519.97, 447.08 ], "normalized_solution": [ 449, 188, 812, 890 ] }, { "height": 502, "width": 640, "id": 399, "original_id": 587559, "dataset_name": "refcoco", "area": 51960.03205000002, "iscrowd": 0, "image_id": 399, "category_id": 23, "bbox_list": [ [ 287.5, 94.44, 518.97, 446.08 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580296.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: animal on right with paws on cage.", "normal_caption": "animal on right with paws on cage", "solution": [ 287.5, 94.44, 519.97, 447.08 ], "normalized_solution": [ 449, 188, 812, 890 ] }, { "height": 502, "width": 640, "id": 400, "original_id": 587040, "dataset_name": "refcoco", "area": 27243.198099999998, "iscrowd": 0, "image_id": 400, "category_id": 23, "bbox_list": [ [ 151.23, 171.7, 384.53999999999996, 380.04999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580296.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left animal.", "normal_caption": "left animal", "solution": [ 151.23, 171.7, 385.54, 381.05 ], "normalized_solution": [ 236, 342, 602, 759 ] }, { "height": 502, "width": 640, "id": 401, "original_id": 587040, "dataset_name": "refcoco", "area": 27243.198099999998, "iscrowd": 0, "image_id": 401, "category_id": 23, "bbox_list": [ [ 151.23, 171.7, 384.53999999999996, 380.04999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580296.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left bear.", "normal_caption": "left bear", "solution": [ 151.23, 171.7, 385.54, 381.05 ], "normalized_solution": [ 236, 342, 602, 759 ] }, { "height": 502, "width": 640, "id": 402, "original_id": 587040, "dataset_name": "refcoco", "area": 27243.198099999998, "iscrowd": 0, "image_id": 402, "category_id": 23, "bbox_list": [ [ 151.23, 171.7, 384.53999999999996, 380.04999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580296.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bear on left.", "normal_caption": "bear on left", "solution": [ 151.23, 171.7, 385.54, 381.05 ], "normalized_solution": [ 236, 342, 602, 759 ] }, { "height": 427, "width": 640, "id": 403, "original_id": 1331028, "dataset_name": "refcoco", "area": 26699.820050000006, "iscrowd": 0, "image_id": 403, "category_id": 1, "bbox_list": [ [ 527.53, 55.56, 639.0, 422.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in black next to lady in red.", "normal_caption": "woman in black next to lady in red", "solution": [ 527.53, 55.56, 640.0, 423.28 ], "normalized_solution": [ 824, 130, 1000, 991 ] }, { "height": 427, "width": 640, "id": 404, "original_id": 1331028, "dataset_name": "refcoco", "area": 26699.820050000006, "iscrowd": 0, "image_id": 404, "category_id": 1, "bbox_list": [ [ 527.53, 55.56, 639.0, 422.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right blackwoman.", "normal_caption": "right blackwoman", "solution": [ 527.53, 55.56, 640.0, 423.28 ], "normalized_solution": [ 824, 130, 1000, 991 ] }, { "height": 427, "width": 640, "id": 405, "original_id": 1331028, "dataset_name": "refcoco", "area": 26699.820050000006, "iscrowd": 0, "image_id": 405, "category_id": 1, "bbox_list": [ [ 527.53, 55.56, 639.0, 422.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right.", "normal_caption": "far right", "solution": [ 527.53, 55.56, 640.0, 423.28 ], "normalized_solution": [ 824, 130, 1000, 991 ] }, { "height": 427, "width": 640, "id": 406, "original_id": 1326126, "dataset_name": "refcoco", "area": 31803.99140000001, "iscrowd": 0, "image_id": 406, "category_id": 1, "bbox_list": [ [ 384.78, 60.45, 573.77, 421.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right in red.", "normal_caption": "woman on right in red", "solution": [ 384.78, 60.45, 574.77, 422.2 ], "normalized_solution": [ 601, 141, 898, 988 ] }, { "height": 427, "width": 640, "id": 407, "original_id": 1326126, "dataset_name": "refcoco", "area": 31803.99140000001, "iscrowd": 0, "image_id": 407, "category_id": 1, "bbox_list": [ [ 384.78, 60.45, 573.77, 421.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in red under umbrella.", "normal_caption": "woman in red under umbrella", "solution": [ 384.78, 60.45, 574.77, 422.2 ], "normalized_solution": [ 601, 141, 898, 988 ] }, { "height": 427, "width": 640, "id": 408, "original_id": 1326126, "dataset_name": "refcoco", "area": 31803.99140000001, "iscrowd": 0, "image_id": 408, "category_id": 1, "bbox_list": [ [ 384.78, 60.45, 573.77, 421.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the girl in red on the right.", "normal_caption": "the girl in red on the right", "solution": [ 384.78, 60.45, 574.77, 422.2 ], "normalized_solution": [ 601, 141, 898, 988 ] }, { "height": 427, "width": 640, "id": 409, "original_id": 1314074, "dataset_name": "refcoco", "area": 19232.034550000004, "iscrowd": 0, "image_id": 409, "category_id": 1, "bbox_list": [ [ 0.96, 80.44, 142.93, 404.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady walking with white shirt boots scarf on on the left.", "normal_caption": "lady walking with white shirt boots scarf on on the left", "solution": [ 0.96, 80.44, 143.93, 405.73 ], "normalized_solution": [ 1, 188, 224, 950 ] }, { "height": 427, "width": 640, "id": 410, "original_id": 1314074, "dataset_name": "refcoco", "area": 19232.034550000004, "iscrowd": 0, "image_id": 410, "category_id": 1, "bbox_list": [ [ 0.96, 80.44, 142.93, 404.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: women in red and white on left.", "normal_caption": "women in red and white on left", "solution": [ 0.96, 80.44, 143.93, 405.73 ], "normalized_solution": [ 1, 188, 224, 950 ] }, { "height": 427, "width": 640, "id": 411, "original_id": 1314074, "dataset_name": "refcoco", "area": 19232.034550000004, "iscrowd": 0, "image_id": 411, "category_id": 1, "bbox_list": [ [ 0.96, 80.44, 142.93, 404.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left woman.", "normal_caption": "left woman", "solution": [ 0.96, 80.44, 143.93, 405.73 ], "normalized_solution": [ 1, 188, 224, 950 ] }, { "height": 427, "width": 640, "id": 412, "original_id": 1241701, "dataset_name": "refcoco", "area": 25027.984849999997, "iscrowd": 0, "image_id": 412, "category_id": 1, "bbox_list": [ [ 211.58, 25.49, 347.14, 364.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guitar.", "normal_caption": "guitar", "solution": [ 211.58, 25.49, 348.14, 365.93 ], "normalized_solution": [ 330, 59, 543, 856 ] }, { "height": 427, "width": 640, "id": 413, "original_id": 1241701, "dataset_name": "refcoco", "area": 25027.984849999997, "iscrowd": 0, "image_id": 413, "category_id": 1, "bbox_list": [ [ 211.58, 25.49, 347.14, 364.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guitar guy.", "normal_caption": "guitar guy", "solution": [ 211.58, 25.49, 348.14, 365.93 ], "normalized_solution": [ 330, 59, 543, 856 ] }, { "height": 427, "width": 640, "id": 414, "original_id": 1241701, "dataset_name": "refcoco", "area": 25027.984849999997, "iscrowd": 0, "image_id": 414, "category_id": 1, "bbox_list": [ [ 211.58, 25.49, 347.14, 364.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580277.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guitar guy.", "normal_caption": "guitar guy", "solution": [ 211.58, 25.49, 348.14, 365.93 ], "normalized_solution": [ 330, 59, 543, 856 ] }, { "height": 508, "width": 640, "id": 415, "original_id": 223281, "dataset_name": "refcoco", "area": 72594.55335, "iscrowd": 0, "image_id": 415, "category_id": 1, "bbox_list": [ [ 330.31, 1.14, 563.95, 501.3 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580257.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the large women on the right.", "normal_caption": "the large women on the right", "solution": [ 330.31, 1.14, 564.95, 502.3 ], "normalized_solution": [ 516, 2, 882, 988 ] }, { "height": 508, "width": 640, "id": 416, "original_id": 223281, "dataset_name": "refcoco", "area": 72594.55335, "iscrowd": 0, "image_id": 416, "category_id": 1, "bbox_list": [ [ 330.31, 1.14, 563.95, 501.3 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580257.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bigger woman.", "normal_caption": "bigger woman", "solution": [ 330.31, 1.14, 564.95, 502.3 ], "normalized_solution": [ 516, 2, 882, 988 ] }, { "height": 508, "width": 640, "id": 417, "original_id": 223281, "dataset_name": "refcoco", "area": 72594.55335, "iscrowd": 0, "image_id": 417, "category_id": 1, "bbox_list": [ [ 330.31, 1.14, 563.95, 501.3 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580257.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right woman.", "normal_caption": "right woman", "solution": [ 330.31, 1.14, 564.95, 502.3 ], "normalized_solution": [ 516, 2, 882, 988 ] }, { "height": 508, "width": 640, "id": 418, "original_id": 195788, "dataset_name": "refcoco", "area": 41629.25855000001, "iscrowd": 0, "image_id": 418, "category_id": 1, "bbox_list": [ [ 153.59, 30.15, 399.78999999999996, 501.21999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580257.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady on left those pizza slices looked great.", "normal_caption": "lady on left those pizza slices looked great", "solution": [ 153.59, 30.15, 400.79, 502.22 ], "normalized_solution": [ 239, 59, 626, 988 ] }, { "height": 508, "width": 640, "id": 419, "original_id": 195788, "dataset_name": "refcoco", "area": 41629.25855000001, "iscrowd": 0, "image_id": 419, "category_id": 1, "bbox_list": [ [ 153.59, 30.15, 399.78999999999996, 501.21999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580257.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady on left.", "normal_caption": "lady on left", "solution": [ 153.59, 30.15, 400.79, 502.22 ], "normalized_solution": [ 239, 59, 626, 988 ] }, { "height": 508, "width": 640, "id": 420, "original_id": 195788, "dataset_name": "refcoco", "area": 41629.25855000001, "iscrowd": 0, "image_id": 420, "category_id": 1, "bbox_list": [ [ 153.59, 30.15, 399.78999999999996, 501.21999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580257.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left woman.", "normal_caption": "left woman", "solution": [ 153.59, 30.15, 400.79, 502.22 ], "normalized_solution": [ 239, 59, 626, 988 ] }, { "height": 427, "width": 640, "id": 421, "original_id": 2225384, "dataset_name": "refcoco", "area": 62942.185, "iscrowd": 0, "image_id": 421, "category_id": 63, "bbox_list": [ [ 1.5, 0.0, 470.5, 225.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580234.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sewn hanging behind cat.", "normal_caption": "sewn hanging behind cat", "solution": [ 1.5, 0.0, 471.5, 226.85 ], "normalized_solution": [ 2, 0, 736, 531 ] }, { "height": 427, "width": 640, "id": 422, "original_id": 2225384, "dataset_name": "refcoco", "area": 62942.185, "iscrowd": 0, "image_id": 422, "category_id": 63, "bbox_list": [ [ 1.5, 0.0, 470.5, 225.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580234.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blck above cat.", "normal_caption": "blck above cat", "solution": [ 1.5, 0.0, 471.5, 226.85 ], "normalized_solution": [ 2, 0, 736, 531 ] }, { "height": 427, "width": 640, "id": 423, "original_id": 98770, "dataset_name": "refcoco", "area": 58460.286750000014, "iscrowd": 0, "image_id": 423, "category_id": 63, "bbox_list": [ [ 0.92, 121.21, 561.91, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580234.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: a place for a cat to lay down.", "normal_caption": "a place for a cat to lay down", "solution": [ 0.92, 121.21, 562.91, 427.0 ], "normalized_solution": [ 1, 283, 879, 1000 ] }, { "height": 427, "width": 640, "id": 424, "original_id": 98770, "dataset_name": "refcoco", "area": 58460.286750000014, "iscrowd": 0, "image_id": 424, "category_id": 63, "bbox_list": [ [ 0.92, 121.21, 561.91, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580234.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the cats white bed.", "normal_caption": "the cats white bed", "solution": [ 0.92, 121.21, 562.91, 427.0 ], "normalized_solution": [ 1, 283, 879, 1000 ] }, { "height": 427, "width": 640, "id": 425, "original_id": 98770, "dataset_name": "refcoco", "area": 58460.286750000014, "iscrowd": 0, "image_id": 425, "category_id": 63, "bbox_list": [ [ 0.92, 121.21, 561.91, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580234.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white part of the cats bed.", "normal_caption": "white part of the cats bed", "solution": [ 0.92, 121.21, 562.91, 427.0 ], "normalized_solution": [ 1, 283, 879, 1000 ] }, { "height": 464, "width": 640, "id": 426, "original_id": 1199227, "dataset_name": "refcoco", "area": 19837.948450000007, "iscrowd": 0, "image_id": 426, "category_id": 10, "bbox_list": [ [ 194.98, 200.92, 303.46999999999997, 403.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580142.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: dont walk signal on the left.", "normal_caption": "dont walk signal on the left", "solution": [ 194.98, 200.92, 304.47, 404.25 ], "normalized_solution": [ 304, 433, 475, 871 ] }, { "height": 464, "width": 640, "id": 427, "original_id": 1199227, "dataset_name": "refcoco", "area": 19837.948450000007, "iscrowd": 0, "image_id": 427, "category_id": 10, "bbox_list": [ [ 194.98, 200.92, 303.46999999999997, 403.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580142.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: walk signal.", "normal_caption": "walk signal", "solution": [ 194.98, 200.92, 304.47, 404.25 ], "normalized_solution": [ 304, 433, 475, 871 ] }, { "height": 464, "width": 640, "id": 428, "original_id": 1199227, "dataset_name": "refcoco", "area": 19837.948450000007, "iscrowd": 0, "image_id": 428, "category_id": 10, "bbox_list": [ [ 194.98, 200.92, 303.46999999999997, 403.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580142.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: 16.", "normal_caption": "16", "solution": [ 194.98, 200.92, 304.47, 404.25 ], "normalized_solution": [ 304, 433, 475, 871 ] }, { "height": 464, "width": 640, "id": 429, "original_id": 1198716, "dataset_name": "refcoco", "area": 21447.912300000004, "iscrowd": 0, "image_id": 429, "category_id": 10, "bbox_list": [ [ 321.15, 25.95, 430.67999999999995, 277.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580142.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: stoplight.", "normal_caption": "stoplight", "solution": [ 321.15, 25.95, 431.68, 278.28 ], "normalized_solution": [ 501, 55, 674, 599 ] }, { "height": 464, "width": 640, "id": 430, "original_id": 1198716, "dataset_name": "refcoco", "area": 21447.912300000004, "iscrowd": 0, "image_id": 430, "category_id": 10, "bbox_list": [ [ 321.15, 25.95, 430.67999999999995, 277.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580142.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: righ signal.", "normal_caption": "righ signal", "solution": [ 321.15, 25.95, 431.68, 278.28 ], "normalized_solution": [ 501, 55, 674, 599 ] }, { "height": 464, "width": 640, "id": 431, "original_id": 1198716, "dataset_name": "refcoco", "area": 21447.912300000004, "iscrowd": 0, "image_id": 431, "category_id": 10, "bbox_list": [ [ 321.15, 25.95, 430.67999999999995, 277.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580142.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: green light.", "normal_caption": "green light", "solution": [ 321.15, 25.95, 431.68, 278.28 ], "normalized_solution": [ 501, 55, 674, 599 ] }, { "height": 480, "width": 640, "id": 432, "original_id": 1320948, "dataset_name": "refcoco", "area": 12329.196999999998, "iscrowd": 0, "image_id": 432, "category_id": 1, "bbox_list": [ [ 28.04, 291.24, 180.20999999999998, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580120.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: child bottom left leaning over.", "normal_caption": "child bottom left leaning over", "solution": [ 28.04, 291.24, 181.21, 473.53 ], "normalized_solution": [ 43, 606, 283, 986 ] }, { "height": 480, "width": 640, "id": 433, "original_id": 1320948, "dataset_name": "refcoco", "area": 12329.196999999998, "iscrowd": 0, "image_id": 433, "category_id": 1, "bbox_list": [ [ 28.04, 291.24, 180.20999999999998, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580120.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid white tee lower left.", "normal_caption": "kid white tee lower left", "solution": [ 28.04, 291.24, 181.21, 473.53 ], "normalized_solution": [ 43, 606, 283, 986 ] }, { "height": 480, "width": 640, "id": 434, "original_id": 1320948, "dataset_name": "refcoco", "area": 12329.196999999998, "iscrowd": 0, "image_id": 434, "category_id": 1, "bbox_list": [ [ 28.04, 291.24, 180.20999999999998, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580120.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid left side bent over desk.", "normal_caption": "kid left side bent over desk", "solution": [ 28.04, 291.24, 181.21, 473.53 ], "normalized_solution": [ 43, 606, 283, 986 ] }, { "height": 480, "width": 640, "id": 435, "original_id": 1208097, "dataset_name": "refcoco", "area": 12563.67145, "iscrowd": 0, "image_id": 435, "category_id": 1, "bbox_list": [ [ 144.77, 229.3, 239.84, 409.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580120.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy white shirt.", "normal_caption": "guy white shirt", "solution": [ 144.77, 229.3, 240.84, 410.77 ], "normalized_solution": [ 226, 477, 376, 855 ] }, { "height": 480, "width": 640, "id": 436, "original_id": 1208097, "dataset_name": "refcoco", "area": 12563.67145, "iscrowd": 0, "image_id": 436, "category_id": 1, "bbox_list": [ [ 144.77, 229.3, 239.84, 409.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580120.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: standing boy with glasses.", "normal_caption": "standing boy with glasses", "solution": [ 144.77, 229.3, 240.84, 410.77 ], "normalized_solution": [ 226, 477, 376, 855 ] }, { "height": 480, "width": 640, "id": 437, "original_id": 1208097, "dataset_name": "refcoco", "area": 12563.67145, "iscrowd": 0, "image_id": 437, "category_id": 1, "bbox_list": [ [ 144.77, 229.3, 239.84, 409.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580120.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: buttonup shirt standing.", "normal_caption": "buttonup shirt standing", "solution": [ 144.77, 229.3, 240.84, 410.77 ], "normalized_solution": [ 226, 477, 376, 855 ] }, { "height": 375, "width": 500, "id": 438, "original_id": 236590, "dataset_name": "refcoco", "area": 30520.807149999997, "iscrowd": 0, "image_id": 438, "category_id": 1, "bbox_list": [ [ 129.22, 122.04, 472.82000000000005, 343.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580052.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right kid in white.", "normal_caption": "right kid in white", "solution": [ 129.22, 122.04, 473.82, 344.17 ], "normalized_solution": [ 258, 325, 947, 917 ] }, { "height": 375, "width": 500, "id": 439, "original_id": 236590, "dataset_name": "refcoco", "area": 30520.807149999997, "iscrowd": 0, "image_id": 439, "category_id": 1, "bbox_list": [ [ 129.22, 122.04, 472.82000000000005, 343.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580052.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right boy.", "normal_caption": "right boy", "solution": [ 129.22, 122.04, 473.82, 344.17 ], "normalized_solution": [ 258, 325, 947, 917 ] }, { "height": 375, "width": 500, "id": 440, "original_id": 236590, "dataset_name": "refcoco", "area": 30520.807149999997, "iscrowd": 0, "image_id": 440, "category_id": 1, "bbox_list": [ [ 129.22, 122.04, 472.82000000000005, 343.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580052.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid in white.", "normal_caption": "kid in white", "solution": [ 129.22, 122.04, 473.82, 344.17 ], "normalized_solution": [ 258, 325, 947, 917 ] }, { "height": 375, "width": 500, "id": 441, "original_id": 204741, "dataset_name": "refcoco", "area": 19668.75099999999, "iscrowd": 0, "image_id": 441, "category_id": 1, "bbox_list": [ [ 42.83, 102.3, 290.75, 288.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580052.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy in blue stripes.", "normal_caption": "boy in blue stripes", "solution": [ 42.83, 102.3, 291.75, 289.18 ], "normalized_solution": [ 85, 272, 583, 771 ] }, { "height": 375, "width": 500, "id": 442, "original_id": 204741, "dataset_name": "refcoco", "area": 19668.75099999999, "iscrowd": 0, "image_id": 442, "category_id": 1, "bbox_list": [ [ 42.83, 102.3, 290.75, 288.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580052.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy in blue.", "normal_caption": "boy in blue", "solution": [ 42.83, 102.3, 291.75, 289.18 ], "normalized_solution": [ 85, 272, 583, 771 ] }, { "height": 375, "width": 500, "id": 443, "original_id": 204741, "dataset_name": "refcoco", "area": 19668.75099999999, "iscrowd": 0, "image_id": 443, "category_id": 1, "bbox_list": [ [ 42.83, 102.3, 290.75, 288.18 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580052.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy in stripes.", "normal_caption": "boy in stripes", "solution": [ 42.83, 102.3, 291.75, 289.18 ], "normalized_solution": [ 85, 272, 583, 771 ] }, { "height": 437, "width": 640, "id": 444, "original_id": 1735631, "dataset_name": "refcoco", "area": 25122.75, "iscrowd": 0, "image_id": 444, "category_id": 1, "bbox_list": [ [ 308.5, 193.5, 544.5, 414.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580026.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy in front with white shirt.", "normal_caption": "boy in front with white shirt", "solution": [ 308.5, 193.5, 545.5, 415.0 ], "normalized_solution": [ 482, 442, 852, 949 ] }, { "height": 437, "width": 640, "id": 445, "original_id": 1735631, "dataset_name": "refcoco", "area": 25122.75, "iscrowd": 0, "image_id": 445, "category_id": 1, "bbox_list": [ [ 308.5, 193.5, 544.5, 414.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580026.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy.", "normal_caption": "boy", "solution": [ 308.5, 193.5, 545.5, 415.0 ], "normalized_solution": [ 482, 442, 852, 949 ] }, { "height": 437, "width": 640, "id": 446, "original_id": 1735631, "dataset_name": "refcoco", "area": 25122.75, "iscrowd": 0, "image_id": 446, "category_id": 1, "bbox_list": [ [ 308.5, 193.5, 544.5, 414.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580026.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid in white.", "normal_caption": "kid in white", "solution": [ 308.5, 193.5, 545.5, 415.0 ], "normalized_solution": [ 482, 442, 852, 949 ] }, { "height": 437, "width": 640, "id": 447, "original_id": 1741004, "dataset_name": "refcoco", "area": 11002.7033, "iscrowd": 0, "image_id": 447, "category_id": 1, "bbox_list": [ [ 342.05, 131.64, 477.0, 282.78 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580026.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: little girl at table.", "normal_caption": "little girl at table", "solution": [ 342.05, 131.64, 478.0, 283.78 ], "normalized_solution": [ 534, 301, 746, 649 ] }, { "height": 437, "width": 640, "id": 448, "original_id": 1741004, "dataset_name": "refcoco", "area": 11002.7033, "iscrowd": 0, "image_id": 448, "category_id": 1, "bbox_list": [ [ 342.05, 131.64, 477.0, 282.78 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580026.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 342.05, 131.64, 478.0, 283.78 ], "normalized_solution": [ 534, 301, 746, 649 ] }, { "height": 437, "width": 640, "id": 449, "original_id": 1741004, "dataset_name": "refcoco", "area": 11002.7033, "iscrowd": 0, "image_id": 449, "category_id": 1, "bbox_list": [ [ 342.05, 131.64, 477.0, 282.78 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000580026.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 342.05, 131.64, 478.0, 283.78 ], "normalized_solution": [ 534, 301, 746, 649 ] }, { "height": 426, "width": 640, "id": 450, "original_id": 562284, "dataset_name": "refcoco", "area": 18569.4619, "iscrowd": 0, "image_id": 450, "category_id": 1, "bbox_list": [ [ 1.49, 200.69, 133.89000000000001, 385.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on left.", "normal_caption": "person on left", "solution": [ 1.49, 200.69, 134.89, 386.98 ], "normalized_solution": [ 2, 471, 210, 908 ] }, { "height": 426, "width": 640, "id": 451, "original_id": 562284, "dataset_name": "refcoco", "area": 18569.4619, "iscrowd": 0, "image_id": 451, "category_id": 1, "bbox_list": [ [ 1.49, 200.69, 133.89000000000001, 385.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: fan on the far left in yellow with visible face.", "normal_caption": "fan on the far left in yellow with visible face", "solution": [ 1.49, 200.69, 134.89, 386.98 ], "normalized_solution": [ 2, 471, 210, 908 ] }, { "height": 426, "width": 640, "id": 452, "original_id": 562284, "dataset_name": "refcoco", "area": 18569.4619, "iscrowd": 0, "image_id": 452, "category_id": 1, "bbox_list": [ [ 1.49, 200.69, 133.89000000000001, 385.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person watching on far left.", "normal_caption": "person watching on far left", "solution": [ 1.49, 200.69, 134.89, 386.98 ], "normalized_solution": [ 2, 471, 210, 908 ] }, { "height": 426, "width": 640, "id": 453, "original_id": 453693, "dataset_name": "refcoco", "area": 13069.897949999999, "iscrowd": 0, "image_id": 453, "category_id": 1, "bbox_list": [ [ 425.68, 219.3, 541.79, 389.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blurry person to the right of the players elbow.", "normal_caption": "blurry person to the right of the players elbow", "solution": [ 425.68, 219.3, 542.79, 390.11 ], "normalized_solution": [ 665, 514, 848, 915 ] }, { "height": 426, "width": 640, "id": 454, "original_id": 453693, "dataset_name": "refcoco", "area": 13069.897949999999, "iscrowd": 0, "image_id": 454, "category_id": 1, "bbox_list": [ [ 425.68, 219.3, 541.79, 389.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blurry person to right of players elbow.", "normal_caption": "blurry person to right of players elbow", "solution": [ 425.68, 219.3, 542.79, 390.11 ], "normalized_solution": [ 665, 514, 848, 915 ] }, { "height": 426, "width": 640, "id": 455, "original_id": 453693, "dataset_name": "refcoco", "area": 13069.897949999999, "iscrowd": 0, "image_id": 455, "category_id": 1, "bbox_list": [ [ 425.68, 219.3, 541.79, 389.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black shirt background.", "normal_caption": "black shirt background", "solution": [ 425.68, 219.3, 542.79, 390.11 ], "normalized_solution": [ 665, 514, 848, 915 ] }, { "height": 426, "width": 640, "id": 456, "original_id": 445779, "dataset_name": "refcoco", "area": 39632.328099999984, "iscrowd": 0, "image_id": 456, "category_id": 1, "bbox_list": [ [ 169.44, 119.37, 423.09000000000003, 392.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player.", "normal_caption": "player", "solution": [ 169.44, 119.37, 424.09, 393.16 ], "normalized_solution": [ 264, 280, 662, 922 ] }, { "height": 426, "width": 640, "id": 457, "original_id": 445779, "dataset_name": "refcoco", "area": 39632.328099999984, "iscrowd": 0, "image_id": 457, "category_id": 1, "bbox_list": [ [ 169.44, 119.37, 423.09000000000003, 392.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man with paddle.", "normal_caption": "man with paddle", "solution": [ 169.44, 119.37, 424.09, 393.16 ], "normalized_solution": [ 264, 280, 662, 922 ] }, { "height": 426, "width": 640, "id": 458, "original_id": 445779, "dataset_name": "refcoco", "area": 39632.328099999984, "iscrowd": 0, "image_id": 458, "category_id": 1, "bbox_list": [ [ 169.44, 119.37, 423.09000000000003, 392.16 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579997.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player.", "normal_caption": "player", "solution": [ 169.44, 119.37, 424.09, 393.16 ], "normalized_solution": [ 264, 280, 662, 922 ] }, { "height": 375, "width": 500, "id": 459, "original_id": 1647570, "dataset_name": "refcoco", "area": 27759.529850000006, "iscrowd": 0, "image_id": 459, "category_id": 82, "bbox_list": [ [ 238.48, 43.03, 337.76, 369.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579909.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right fridge door.", "normal_caption": "right fridge door", "solution": [ 238.48, 43.03, 338.76, 370.0 ], "normalized_solution": [ 476, 114, 677, 986 ] }, { "height": 375, "width": 500, "id": 460, "original_id": 1647570, "dataset_name": "refcoco", "area": 27759.529850000006, "iscrowd": 0, "image_id": 460, "category_id": 82, "bbox_list": [ [ 238.48, 43.03, 337.76, 369.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579909.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the panel to the right of the lit up panel.", "normal_caption": "the panel to the right of the lit up panel", "solution": [ 238.48, 43.03, 338.76, 370.0 ], "normalized_solution": [ 476, 114, 677, 986 ] }, { "height": 375, "width": 500, "id": 461, "original_id": 1647570, "dataset_name": "refcoco", "area": 27759.529850000006, "iscrowd": 0, "image_id": 461, "category_id": 82, "bbox_list": [ [ 238.48, 43.03, 337.76, 369.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579909.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right brown.", "normal_caption": "right brown", "solution": [ 238.48, 43.03, 338.76, 370.0 ], "normalized_solution": [ 476, 114, 677, 986 ] }, { "height": 375, "width": 500, "id": 462, "original_id": 331012, "dataset_name": "refcoco", "area": 50171.54604999999, "iscrowd": 0, "image_id": 462, "category_id": 82, "bbox_list": [ [ 49.5, 47.06, 243.13, 374.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579909.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left side of fridge.", "normal_caption": "left side of fridge", "solution": [ 49.5, 47.06, 244.13, 375.0 ], "normalized_solution": [ 99, 125, 488, 1000 ] }, { "height": 375, "width": 500, "id": 463, "original_id": 331012, "dataset_name": "refcoco", "area": 50171.54604999999, "iscrowd": 0, "image_id": 463, "category_id": 82, "bbox_list": [ [ 49.5, 47.06, 243.13, 374.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579909.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: freezer on left with water dispenser.", "normal_caption": "freezer on left with water dispenser", "solution": [ 49.5, 47.06, 244.13, 375.0 ], "normalized_solution": [ 99, 125, 488, 1000 ] }, { "height": 375, "width": 500, "id": 464, "original_id": 331012, "dataset_name": "refcoco", "area": 50171.54604999999, "iscrowd": 0, "image_id": 464, "category_id": 82, "bbox_list": [ [ 49.5, 47.06, 243.13, 374.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579909.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: ice maker on fridge.", "normal_caption": "ice maker on fridge", "solution": [ 49.5, 47.06, 244.13, 375.0 ], "normalized_solution": [ 99, 125, 488, 1000 ] }, { "height": 480, "width": 640, "id": 465, "original_id": 1951361, "dataset_name": "refcoco", "area": 26343.198250000012, "iscrowd": 0, "image_id": 465, "category_id": 63, "bbox_list": [ [ 0.0, 251.41, 210.74, 418.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579907.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the loveseat on the left of the room.", "normal_caption": "the loveseat on the left of the room", "solution": [ 0.0, 251.41, 211.74, 419.35 ], "normalized_solution": [ 0, 523, 330, 873 ] }, { "height": 480, "width": 640, "id": 466, "original_id": 1951361, "dataset_name": "refcoco", "area": 26343.198250000012, "iscrowd": 0, "image_id": 466, "category_id": 63, "bbox_list": [ [ 0.0, 251.41, 210.74, 418.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579907.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left couch.", "normal_caption": "left couch", "solution": [ 0.0, 251.41, 211.74, 419.35 ], "normalized_solution": [ 0, 523, 330, 873 ] }, { "height": 640, "width": 426, "id": 467, "original_id": 1278510, "dataset_name": "refcoco", "area": 11064.101899999998, "iscrowd": 0, "image_id": 467, "category_id": 1, "bbox_list": [ [ 211.8, 399.27, 345.5, 615.5699999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blurry person below batters crotch.", "normal_caption": "blurry person below batters crotch", "solution": [ 211.8, 399.27, 346.5, 616.57 ], "normalized_solution": [ 497, 623, 813, 963 ] }, { "height": 640, "width": 426, "id": 468, "original_id": 1278510, "dataset_name": "refcoco", "area": 11064.101899999998, "iscrowd": 0, "image_id": 468, "category_id": 1, "bbox_list": [ [ 211.8, 399.27, 345.5, 615.5699999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blurry person between batters legs.", "normal_caption": "blurry person between batters legs", "solution": [ 211.8, 399.27, 346.5, 616.57 ], "normalized_solution": [ 497, 623, 813, 963 ] }, { "height": 640, "width": 426, "id": 469, "original_id": 1278510, "dataset_name": "refcoco", "area": 11064.101899999998, "iscrowd": 0, "image_id": 469, "category_id": 1, "bbox_list": [ [ 211.8, 399.27, 345.5, 615.5699999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: spot between player legs.", "normal_caption": "spot between player legs", "solution": [ 211.8, 399.27, 346.5, 616.57 ], "normalized_solution": [ 497, 623, 813, 963 ] }, { "height": 640, "width": 426, "id": 470, "original_id": 1255208, "dataset_name": "refcoco", "area": 10384.684449999999, "iscrowd": 0, "image_id": 470, "category_id": 1, "bbox_list": [ [ 340.97, 352.34, 424.70000000000005, 592.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in the back ground to right.", "normal_caption": "man in the back ground to right", "solution": [ 340.97, 352.34, 425.7, 593.25 ], "normalized_solution": [ 800, 550, 999, 926 ] }, { "height": 640, "width": 426, "id": 471, "original_id": 1255208, "dataset_name": "refcoco", "area": 10384.684449999999, "iscrowd": 0, "image_id": 471, "category_id": 1, "bbox_list": [ [ 340.97, 352.34, 424.70000000000005, 592.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player in the bottom right of pic wearing the hat.", "normal_caption": "player in the bottom right of pic wearing the hat", "solution": [ 340.97, 352.34, 425.7, 593.25 ], "normalized_solution": [ 800, 550, 999, 926 ] }, { "height": 640, "width": 426, "id": 472, "original_id": 1253751, "dataset_name": "refcoco", "area": 66371.6081, "iscrowd": 0, "image_id": 472, "category_id": 1, "bbox_list": [ [ 83.42, 105.08, 384.44, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: baseball man.", "normal_caption": "baseball man", "solution": [ 83.42, 105.08, 385.44, 640.0 ], "normalized_solution": [ 195, 164, 904, 1000 ] }, { "height": 640, "width": 426, "id": 473, "original_id": 1253751, "dataset_name": "refcoco", "area": 66371.6081, "iscrowd": 0, "image_id": 473, "category_id": 1, "bbox_list": [ [ 83.42, 105.08, 384.44, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579901.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 83.42, 105.08, 385.44, 640.0 ], "normalized_solution": [ 195, 164, 904, 1000 ] }, { "height": 480, "width": 640, "id": 474, "original_id": 1820607, "dataset_name": "refcoco", "area": 25120.604499999987, "iscrowd": 0, "image_id": 474, "category_id": 21, "bbox_list": [ [ 517.41, 101.7, 639.0, 384.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: farthest right cow 99.", "normal_caption": "farthest right cow 99", "solution": [ 517.41, 101.7, 640.0, 385.59 ], "normalized_solution": [ 808, 211, 1000, 803 ] }, { "height": 480, "width": 640, "id": 475, "original_id": 1820607, "dataset_name": "refcoco", "area": 25120.604499999987, "iscrowd": 0, "image_id": 475, "category_id": 21, "bbox_list": [ [ 517.41, 101.7, 639.0, 384.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: rightmost black cow tag 99.", "normal_caption": "rightmost black cow tag 99", "solution": [ 517.41, 101.7, 640.0, 385.59 ], "normalized_solution": [ 808, 211, 1000, 803 ] }, { "height": 480, "width": 640, "id": 476, "original_id": 1820515, "dataset_name": "refcoco", "area": 14950.390200000002, "iscrowd": 0, "image_id": 476, "category_id": 21, "bbox_list": [ [ 148.85, 98.57, 515.6, 385.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second cow from top middle.", "normal_caption": "second cow from top middle", "solution": [ 148.85, 98.57, 516.6, 386.49 ], "normalized_solution": [ 232, 205, 807, 805 ] }, { "height": 480, "width": 640, "id": 477, "original_id": 1820515, "dataset_name": "refcoco", "area": 14950.390200000002, "iscrowd": 0, "image_id": 477, "category_id": 21, "bbox_list": [ [ 148.85, 98.57, 515.6, 385.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow right behind front cow.", "normal_caption": "cow right behind front cow", "solution": [ 148.85, 98.57, 516.6, 386.49 ], "normalized_solution": [ 232, 205, 807, 805 ] }, { "height": 480, "width": 640, "id": 478, "original_id": 1820515, "dataset_name": "refcoco", "area": 14950.390200000002, "iscrowd": 0, "image_id": 478, "category_id": 21, "bbox_list": [ [ 148.85, 98.57, 515.6, 385.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bigger cows back.", "normal_caption": "bigger cows back", "solution": [ 148.85, 98.57, 516.6, 386.49 ], "normalized_solution": [ 232, 205, 807, 805 ] }, { "height": 480, "width": 640, "id": 479, "original_id": 73875, "dataset_name": "refcoco", "area": 86482.57764999998, "iscrowd": 0, "image_id": 479, "category_id": 21, "bbox_list": [ [ 71.23, 118.71, 533.71, 408.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front cow.", "normal_caption": "front cow", "solution": [ 71.23, 118.71, 534.71, 409.81 ], "normalized_solution": [ 111, 247, 835, 853 ] }, { "height": 480, "width": 640, "id": 480, "original_id": 73875, "dataset_name": "refcoco", "area": 86482.57764999998, "iscrowd": 0, "image_id": 480, "category_id": 21, "bbox_list": [ [ 71.23, 118.71, 533.71, 408.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow looking at us pissed off.", "normal_caption": "cow looking at us pissed off", "solution": [ 71.23, 118.71, 534.71, 409.81 ], "normalized_solution": [ 111, 247, 835, 853 ] }, { "height": 480, "width": 640, "id": 481, "original_id": 73875, "dataset_name": "refcoco", "area": 86482.57764999998, "iscrowd": 0, "image_id": 481, "category_id": 21, "bbox_list": [ [ 71.23, 118.71, 533.71, 408.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579787.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front cow.", "normal_caption": "front cow", "solution": [ 71.23, 118.71, 534.71, 409.81 ], "normalized_solution": [ 111, 247, 835, 853 ] }, { "height": 427, "width": 640, "id": 482, "original_id": 532897, "dataset_name": "refcoco", "area": 38958.83885, "iscrowd": 0, "image_id": 482, "category_id": 1, "bbox_list": [ [ 126.66, 178.54, 423.12, 420.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle spots.", "normal_caption": "middle spots", "solution": [ 126.66, 178.54, 424.12, 421.31 ], "normalized_solution": [ 197, 418, 662, 986 ] }, { "height": 427, "width": 640, "id": 483, "original_id": 532897, "dataset_name": "refcoco", "area": 38958.83885, "iscrowd": 0, "image_id": 483, "category_id": 1, "bbox_list": [ [ 126.66, 178.54, 423.12, 420.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: animal print shirt.", "normal_caption": "animal print shirt", "solution": [ 126.66, 178.54, 424.12, 421.31 ], "normalized_solution": [ 197, 418, 662, 986 ] }, { "height": 427, "width": 640, "id": 484, "original_id": 532897, "dataset_name": "refcoco", "area": 38958.83885, "iscrowd": 0, "image_id": 484, "category_id": 1, "bbox_list": [ [ 126.66, 178.54, 423.12, 420.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: polka dot shirt.", "normal_caption": "polka dot shirt", "solution": [ 126.66, 178.54, 424.12, 421.31 ], "normalized_solution": [ 197, 418, 662, 986 ] }, { "height": 427, "width": 640, "id": 485, "original_id": 488528, "dataset_name": "refcoco", "area": 58068.02354999998, "iscrowd": 0, "image_id": 485, "category_id": 1, "bbox_list": [ [ 304.86, 80.3, 598.1500000000001, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in gray.", "normal_caption": "girl in gray", "solution": [ 304.86, 80.3, 599.15, 427.0 ], "normalized_solution": [ 476, 188, 936, 1000 ] }, { "height": 427, "width": 640, "id": 486, "original_id": 488528, "dataset_name": "refcoco", "area": 58068.02354999998, "iscrowd": 0, "image_id": 486, "category_id": 1, "bbox_list": [ [ 304.86, 80.3, 598.1500000000001, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: glasses.", "normal_caption": "glasses", "solution": [ 304.86, 80.3, 599.15, 427.0 ], "normalized_solution": [ 476, 188, 936, 1000 ] }, { "height": 427, "width": 640, "id": 487, "original_id": 488528, "dataset_name": "refcoco", "area": 58068.02354999998, "iscrowd": 0, "image_id": 487, "category_id": 1, "bbox_list": [ [ 304.86, 80.3, 598.1500000000001, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl with glasses.", "normal_caption": "girl with glasses", "solution": [ 304.86, 80.3, 599.15, 427.0 ], "normalized_solution": [ 476, 188, 936, 1000 ] }, { "height": 427, "width": 640, "id": 488, "original_id": 454591, "dataset_name": "refcoco", "area": 84486.25124999997, "iscrowd": 0, "image_id": 488, "category_id": 1, "bbox_list": [ [ 0.0, 8.69, 342.89, 419.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: stripe hoodie.", "normal_caption": "stripe hoodie", "solution": [ 0.0, 8.69, 343.89, 420.41 ], "normalized_solution": [ 0, 20, 537, 984 ] }, { "height": 427, "width": 640, "id": 489, "original_id": 454591, "dataset_name": "refcoco", "area": 84486.25124999997, "iscrowd": 0, "image_id": 489, "category_id": 1, "bbox_list": [ [ 0.0, 8.69, 342.89, 419.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy.", "normal_caption": "boy", "solution": [ 0.0, 8.69, 343.89, 420.41 ], "normalized_solution": [ 0, 20, 537, 984 ] }, { "height": 427, "width": 640, "id": 490, "original_id": 454591, "dataset_name": "refcoco", "area": 84486.25124999997, "iscrowd": 0, "image_id": 490, "category_id": 1, "bbox_list": [ [ 0.0, 8.69, 342.89, 419.41 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579785.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: purple striped shirt.", "normal_caption": "purple striped shirt", "solution": [ 0.0, 8.69, 343.89, 420.41 ], "normalized_solution": [ 0, 20, 537, 984 ] }, { "height": 480, "width": 640, "id": 491, "original_id": 440062, "dataset_name": "refcoco", "area": 39819.046899999994, "iscrowd": 0, "image_id": 491, "category_id": 1, "bbox_list": [ [ 377.53, 140.22, 550.1899999999999, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579680.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man right.", "normal_caption": "man right", "solution": [ 377.53, 140.22, 551.19, 474.61 ], "normalized_solution": [ 589, 292, 861, 988 ] }, { "height": 480, "width": 640, "id": 492, "original_id": 440062, "dataset_name": "refcoco", "area": 39819.046899999994, "iscrowd": 0, "image_id": 492, "category_id": 1, "bbox_list": [ [ 377.53, 140.22, 550.1899999999999, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579680.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man gray shirt.", "normal_caption": "man gray shirt", "solution": [ 377.53, 140.22, 551.19, 474.61 ], "normalized_solution": [ 589, 292, 861, 988 ] }, { "height": 480, "width": 640, "id": 493, "original_id": 440062, "dataset_name": "refcoco", "area": 39819.046899999994, "iscrowd": 0, "image_id": 493, "category_id": 1, "bbox_list": [ [ 377.53, 140.22, 550.1899999999999, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579680.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right guy.", "normal_caption": "right guy", "solution": [ 377.53, 140.22, 551.19, 474.61 ], "normalized_solution": [ 589, 292, 861, 988 ] }, { "height": 480, "width": 640, "id": 494, "original_id": 426645, "dataset_name": "refcoco", "area": 46752.659999999974, "iscrowd": 0, "image_id": 494, "category_id": 1, "bbox_list": [ [ 176.5, 110.64, 384.28999999999996, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579680.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on left.", "normal_caption": "guy on left", "solution": [ 176.5, 110.64, 385.29, 480.0 ], "normalized_solution": [ 275, 230, 602, 1000 ] }, { "height": 480, "width": 640, "id": 495, "original_id": 426645, "dataset_name": "refcoco", "area": 46752.659999999974, "iscrowd": 0, "image_id": 495, "category_id": 1, "bbox_list": [ [ 176.5, 110.64, 384.28999999999996, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579680.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man white shirt.", "normal_caption": "man white shirt", "solution": [ 176.5, 110.64, 385.29, 480.0 ], "normalized_solution": [ 275, 230, 602, 1000 ] }, { "height": 612, "width": 612, "id": 496, "original_id": 1293242, "dataset_name": "refcoco", "area": 14095.864699999996, "iscrowd": 0, "image_id": 496, "category_id": 1, "bbox_list": [ [ 460.72, 244.8, 606.87, 443.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl right in red.", "normal_caption": "girl right in red", "solution": [ 460.72, 244.8, 607.87, 444.22 ], "normalized_solution": [ 752, 400, 993, 725 ] }, { "height": 612, "width": 612, "id": 497, "original_id": 1293242, "dataset_name": "refcoco", "area": 14095.864699999996, "iscrowd": 0, "image_id": 497, "category_id": 1, "bbox_list": [ [ 460.72, 244.8, 606.87, 443.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in pink on right side front.", "normal_caption": "girl in pink on right side front", "solution": [ 460.72, 244.8, 607.87, 444.22 ], "normalized_solution": [ 752, 400, 993, 725 ] }, { "height": 612, "width": 612, "id": 498, "original_id": 1223451, "dataset_name": "refcoco", "area": 11143.262899999996, "iscrowd": 0, "image_id": 498, "category_id": 1, "bbox_list": [ [ 94.65, 154.08, 212.21, 345.95000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy on left in the middle with red shirt and blond hair.", "normal_caption": "boy on left in the middle with red shirt and blond hair", "solution": [ 94.65, 154.08, 213.21, 346.95 ], "normalized_solution": [ 154, 251, 348, 566 ] }, { "height": 612, "width": 612, "id": 499, "original_id": 1223451, "dataset_name": "refcoco", "area": 11143.262899999996, "iscrowd": 0, "image_id": 499, "category_id": 1, "bbox_list": [ [ 94.65, 154.08, 212.21, 345.95000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blond boy in red shirt with white stripes.", "normal_caption": "blond boy in red shirt with white stripes", "solution": [ 94.65, 154.08, 213.21, 346.95 ], "normalized_solution": [ 154, 251, 348, 566 ] }, { "height": 612, "width": 612, "id": 500, "original_id": 1223451, "dataset_name": "refcoco", "area": 11143.262899999996, "iscrowd": 0, "image_id": 500, "category_id": 1, "bbox_list": [ [ 94.65, 154.08, 212.21, 345.95000000000005 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blond boy standing on left.", "normal_caption": "blond boy standing on left", "solution": [ 94.65, 154.08, 213.21, 346.95 ], "normalized_solution": [ 154, 251, 348, 566 ] }, { "height": 612, "width": 612, "id": 501, "original_id": 1323748, "dataset_name": "refcoco", "area": 17575.199049999996, "iscrowd": 0, "image_id": 501, "category_id": 1, "bbox_list": [ [ 207.67, 460.72, 356.57, 604.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom middle head.", "normal_caption": "bottom middle head", "solution": [ 207.67, 460.72, 357.57, 605.12 ], "normalized_solution": [ 339, 752, 584, 988 ] }, { "height": 612, "width": 612, "id": 502, "original_id": 1323748, "dataset_name": "refcoco", "area": 17575.199049999996, "iscrowd": 0, "image_id": 502, "category_id": 1, "bbox_list": [ [ 207.67, 460.72, 356.57, 604.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top of head bottom middle.", "normal_caption": "top of head bottom middle", "solution": [ 207.67, 460.72, 357.57, 605.12 ], "normalized_solution": [ 339, 752, 584, 988 ] }, { "height": 612, "width": 612, "id": 503, "original_id": 1323748, "dataset_name": "refcoco", "area": 17575.199049999996, "iscrowd": 0, "image_id": 503, "category_id": 1, "bbox_list": [ [ 207.67, 460.72, 356.57, 604.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the head thats at the bottom middle.", "normal_caption": "the head thats at the bottom middle", "solution": [ 207.67, 460.72, 357.57, 605.12 ], "normalized_solution": [ 339, 752, 584, 988 ] }, { "height": 612, "width": 612, "id": 504, "original_id": 1309311, "dataset_name": "refcoco", "area": 32395.045999999995, "iscrowd": 0, "image_id": 504, "category_id": 1, "bbox_list": [ [ 0.0, 222.21, 190.17, 564.19 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in black dress on left.", "normal_caption": "girl in black dress on left", "solution": [ 0.0, 222.21, 191.17, 565.19 ], "normalized_solution": [ 0, 363, 312, 923 ] }, { "height": 612, "width": 612, "id": 505, "original_id": 1309311, "dataset_name": "refcoco", "area": 32395.045999999995, "iscrowd": 0, "image_id": 505, "category_id": 1, "bbox_list": [ [ 0.0, 222.21, 190.17, 564.19 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left kid in blk.", "normal_caption": "left kid in blk", "solution": [ 0.0, 222.21, 191.17, 565.19 ], "normalized_solution": [ 0, 363, 312, 923 ] }, { "height": 612, "width": 612, "id": 506, "original_id": 1309311, "dataset_name": "refcoco", "area": 32395.045999999995, "iscrowd": 0, "image_id": 506, "category_id": 1, "bbox_list": [ [ 0.0, 222.21, 190.17, 564.19 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 0.0, 222.21, 191.17, 565.19 ], "normalized_solution": [ 0, 363, 312, 923 ] }, { "height": 612, "width": 612, "id": 507, "original_id": 1306923, "dataset_name": "refcoco", "area": 17018.0026, "iscrowd": 0, "image_id": 507, "category_id": 1, "bbox_list": [ [ 0.0, 315.57, 133.29, 611.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left kid.", "normal_caption": "bottom left kid", "solution": [ 0.0, 315.57, 134.29, 612.0 ], "normalized_solution": [ 0, 515, 219, 1000 ] }, { "height": 612, "width": 612, "id": 508, "original_id": 1306923, "dataset_name": "refcoco", "area": 17018.0026, "iscrowd": 0, "image_id": 508, "category_id": 1, "bbox_list": [ [ 0.0, 315.57, 133.29, 611.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579663.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left person.", "normal_caption": "bottom left person", "solution": [ 0.0, 315.57, 134.29, 612.0 ], "normalized_solution": [ 0, 515, 219, 1000 ] }, { "height": 427, "width": 640, "id": 509, "original_id": 310646, "dataset_name": "refcoco", "area": 48200.633200000004, "iscrowd": 0, "image_id": 509, "category_id": 54, "bbox_list": [ [ 0.96, 0.91, 261.33, 289.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579632.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: burger in back.", "normal_caption": "burger in back", "solution": [ 0.96, 0.91, 262.33, 290.04 ], "normalized_solution": [ 1, 2, 409, 679 ] }, { "height": 427, "width": 640, "id": 510, "original_id": 310646, "dataset_name": "refcoco", "area": 48200.633200000004, "iscrowd": 0, "image_id": 510, "category_id": 54, "bbox_list": [ [ 0.96, 0.91, 261.33, 289.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579632.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sandwich on far left.", "normal_caption": "sandwich on far left", "solution": [ 0.96, 0.91, 262.33, 290.04 ], "normalized_solution": [ 1, 2, 409, 679 ] }, { "height": 427, "width": 640, "id": 511, "original_id": 310646, "dataset_name": "refcoco", "area": 48200.633200000004, "iscrowd": 0, "image_id": 511, "category_id": 54, "bbox_list": [ [ 0.96, 0.91, 261.33, 289.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579632.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left half of sandwich.", "normal_caption": "left half of sandwich", "solution": [ 0.96, 0.91, 262.33, 290.04 ], "normalized_solution": [ 1, 2, 409, 679 ] }, { "height": 427, "width": 640, "id": 512, "original_id": 308187, "dataset_name": "refcoco", "area": 106964.33640000004, "iscrowd": 0, "image_id": 512, "category_id": 54, "bbox_list": [ [ 152.84, 0.14, 601.77, 314.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579632.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: burger on the right.", "normal_caption": "burger on the right", "solution": [ 152.84, 0.14, 602.77, 315.37 ], "normalized_solution": [ 238, 0, 941, 738 ] }, { "height": 427, "width": 640, "id": 513, "original_id": 308187, "dataset_name": "refcoco", "area": 106964.33640000004, "iscrowd": 0, "image_id": 513, "category_id": 54, "bbox_list": [ [ 152.84, 0.14, 601.77, 314.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579632.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle sandwich.", "normal_caption": "middle sandwich", "solution": [ 152.84, 0.14, 602.77, 315.37 ], "normalized_solution": [ 238, 0, 941, 738 ] }, { "height": 427, "width": 640, "id": 514, "original_id": 308187, "dataset_name": "refcoco", "area": 106964.33640000004, "iscrowd": 0, "image_id": 514, "category_id": 54, "bbox_list": [ [ 152.84, 0.14, 601.77, 314.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579632.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: burger on the right.", "normal_caption": "burger on the right", "solution": [ 152.84, 0.14, 602.77, 315.37 ], "normalized_solution": [ 238, 0, 941, 738 ] }, { "height": 427, "width": 640, "id": 515, "original_id": 1057163, "dataset_name": "refcoco", "area": 12105.611350000001, "iscrowd": 0, "image_id": 515, "category_id": 56, "bbox_list": [ [ 274.64, 4.01, 457.07, 117.28 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top brocolli just right of center.", "normal_caption": "top brocolli just right of center", "solution": [ 274.64, 4.01, 458.07, 118.28 ], "normalized_solution": [ 429, 9, 715, 277 ] }, { "height": 427, "width": 640, "id": 516, "original_id": 1057163, "dataset_name": "refcoco", "area": 12105.611350000001, "iscrowd": 0, "image_id": 516, "category_id": 56, "bbox_list": [ [ 274.64, 4.01, 457.07, 117.28 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top most broccoli piece.", "normal_caption": "top most broccoli piece", "solution": [ 274.64, 4.01, 458.07, 118.28 ], "normalized_solution": [ 429, 9, 715, 277 ] }, { "height": 427, "width": 640, "id": 517, "original_id": 1057163, "dataset_name": "refcoco", "area": 12105.611350000001, "iscrowd": 0, "image_id": 517, "category_id": 56, "bbox_list": [ [ 274.64, 4.01, 457.07, 117.28 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brocolli back of bowl center right.", "normal_caption": "brocolli back of bowl center right", "solution": [ 274.64, 4.01, 458.07, 118.28 ], "normalized_solution": [ 429, 9, 715, 277 ] }, { "height": 427, "width": 640, "id": 518, "original_id": 1055753, "dataset_name": "refcoco", "area": 26154.560749999997, "iscrowd": 0, "image_id": 518, "category_id": 56, "bbox_list": [ [ 175.81, 168.66, 338.43, 394.09000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: brocolli bottom center.", "normal_caption": "brocolli bottom center", "solution": [ 175.81, 168.66, 339.43, 395.09 ], "normalized_solution": [ 274, 394, 530, 925 ] }, { "height": 427, "width": 640, "id": 519, "original_id": 1055753, "dataset_name": "refcoco", "area": 26154.560749999997, "iscrowd": 0, "image_id": 519, "category_id": 56, "bbox_list": [ [ 175.81, 168.66, 338.43, 394.09000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579631.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccoli closest to the bottom with sesame seeds.", "normal_caption": "broccoli closest to the bottom with sesame seeds", "solution": [ 175.81, 168.66, 339.43, 395.09 ], "normalized_solution": [ 274, 394, 530, 925 ] }, { "height": 374, "width": 500, "id": 520, "original_id": 543651, "dataset_name": "refcoco", "area": 17502.938250000003, "iscrowd": 0, "image_id": 520, "category_id": 1, "bbox_list": [ [ 315.17, 124.39, 444.44000000000005, 368.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579571.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on right.", "normal_caption": "man on right", "solution": [ 315.17, 124.39, 445.44, 369.8 ], "normalized_solution": [ 630, 332, 890, 988 ] }, { "height": 374, "width": 500, "id": 521, "original_id": 543651, "dataset_name": "refcoco", "area": 17502.938250000003, "iscrowd": 0, "image_id": 521, "category_id": 1, "bbox_list": [ [ 315.17, 124.39, 444.44000000000005, 368.8 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579571.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right person.", "normal_caption": "right person", "solution": [ 315.17, 124.39, 445.44, 369.8 ], "normalized_solution": [ 630, 332, 890, 988 ] }, { "height": 374, "width": 500, "id": 522, "original_id": 536345, "dataset_name": "refcoco", "area": 13041.53785, "iscrowd": 0, "image_id": 522, "category_id": 1, "bbox_list": [ [ 88.35, 110.48, 173.51999999999998, 366.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579571.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left man red.", "normal_caption": "left man red", "solution": [ 88.35, 110.48, 174.52, 367.93 ], "normalized_solution": [ 176, 295, 349, 983 ] }, { "height": 374, "width": 500, "id": 523, "original_id": 536345, "dataset_name": "refcoco", "area": 13041.53785, "iscrowd": 0, "image_id": 523, "category_id": 1, "bbox_list": [ [ 88.35, 110.48, 173.51999999999998, 366.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579571.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in red jacket on left smiling.", "normal_caption": "man in red jacket on left smiling", "solution": [ 88.35, 110.48, 174.52, 367.93 ], "normalized_solution": [ 176, 295, 349, 983 ] }, { "height": 374, "width": 500, "id": 524, "original_id": 536345, "dataset_name": "refcoco", "area": 13041.53785, "iscrowd": 0, "image_id": 524, "category_id": 1, "bbox_list": [ [ 88.35, 110.48, 173.51999999999998, 366.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579571.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left man.", "normal_caption": "left man", "solution": [ 88.35, 110.48, 174.52, 367.93 ], "normalized_solution": [ 176, 295, 349, 983 ] }, { "height": 457, "width": 640, "id": 525, "original_id": 1256584, "dataset_name": "refcoco", "area": 22599.645950000006, "iscrowd": 0, "image_id": 525, "category_id": 1, "bbox_list": [ [ 464.19, 107.83, 565.89, 438.53999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: asian male in glasses and suit blue tie.", "normal_caption": "asian male in glasses and suit blue tie", "solution": [ 464.19, 107.83, 566.89, 439.54 ], "normalized_solution": [ 725, 235, 885, 961 ] }, { "height": 457, "width": 640, "id": 526, "original_id": 1256584, "dataset_name": "refcoco", "area": 22599.645950000006, "iscrowd": 0, "image_id": 526, "category_id": 1, "bbox_list": [ [ 464.19, 107.83, 565.89, 438.53999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in blue striped tie.", "normal_caption": "man in blue striped tie", "solution": [ 464.19, 107.83, 566.89, 439.54 ], "normalized_solution": [ 725, 235, 885, 961 ] }, { "height": 457, "width": 640, "id": 527, "original_id": 1256584, "dataset_name": "refcoco", "area": 22599.645950000006, "iscrowd": 0, "image_id": 527, "category_id": 1, "bbox_list": [ [ 464.19, 107.83, 565.89, 438.53999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man with tie.", "normal_caption": "man with tie", "solution": [ 464.19, 107.83, 566.89, 439.54 ], "normalized_solution": [ 725, 235, 885, 961 ] }, { "height": 457, "width": 640, "id": 528, "original_id": 1233912, "dataset_name": "refcoco", "area": 56295.6542, "iscrowd": 0, "image_id": 528, "category_id": 1, "bbox_list": [ [ 189.39, 22.13, 478.64, 456.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in blue.", "normal_caption": "guy in blue", "solution": [ 189.39, 22.13, 479.64, 457.0 ], "normalized_solution": [ 295, 48, 749, 1000 ] }, { "height": 457, "width": 640, "id": 529, "original_id": 1233912, "dataset_name": "refcoco", "area": 56295.6542, "iscrowd": 0, "image_id": 529, "category_id": 1, "bbox_list": [ [ 189.39, 22.13, 478.64, 456.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: officer in black.", "normal_caption": "officer in black", "solution": [ 189.39, 22.13, 479.64, 457.0 ], "normalized_solution": [ 295, 48, 749, 1000 ] }, { "height": 457, "width": 640, "id": 530, "original_id": 1233912, "dataset_name": "refcoco", "area": 56295.6542, "iscrowd": 0, "image_id": 530, "category_id": 1, "bbox_list": [ [ 189.39, 22.13, 478.64, 456.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on right who is shaking hands.", "normal_caption": "guy on right who is shaking hands", "solution": [ 189.39, 22.13, 479.64, 457.0 ], "normalized_solution": [ 295, 48, 749, 1000 ] }, { "height": 457, "width": 640, "id": 531, "original_id": 1229255, "dataset_name": "refcoco", "area": 41547.480350000005, "iscrowd": 0, "image_id": 531, "category_id": 1, "bbox_list": [ [ 21.84, 23.51, 235.15, 456.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white soilder.", "normal_caption": "white soilder", "solution": [ 21.84, 23.51, 236.15, 457.0 ], "normalized_solution": [ 34, 51, 368, 1000 ] }, { "height": 457, "width": 640, "id": 532, "original_id": 1229255, "dataset_name": "refcoco", "area": 41547.480350000005, "iscrowd": 0, "image_id": 532, "category_id": 1, "bbox_list": [ [ 21.84, 23.51, 235.15, 456.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sailor on left.", "normal_caption": "sailor on left", "solution": [ 21.84, 23.51, 236.15, 457.0 ], "normalized_solution": [ 34, 51, 368, 1000 ] }, { "height": 457, "width": 640, "id": 533, "original_id": 1229255, "dataset_name": "refcoco", "area": 41547.480350000005, "iscrowd": 0, "image_id": 533, "category_id": 1, "bbox_list": [ [ 21.84, 23.51, 235.15, 456.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579533.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white guy in white.", "normal_caption": "white guy in white", "solution": [ 21.84, 23.51, 236.15, 457.0 ], "normalized_solution": [ 34, 51, 368, 1000 ] }, { "height": 640, "width": 480, "id": 534, "original_id": 101327, "dataset_name": "refcoco", "area": 16099.130900000004, "iscrowd": 0, "image_id": 534, "category_id": 62, "bbox_list": [ [ 177.55, 496.86, 380.25, 632.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right red chair.", "normal_caption": "far right red chair", "solution": [ 177.55, 496.86, 381.25, 633.12 ], "normalized_solution": [ 369, 776, 794, 989 ] }, { "height": 640, "width": 480, "id": 535, "original_id": 101327, "dataset_name": "refcoco", "area": 16099.130900000004, "iscrowd": 0, "image_id": 535, "category_id": 62, "bbox_list": [ [ 177.55, 496.86, 380.25, 632.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red chair lowest.", "normal_caption": "red chair lowest", "solution": [ 177.55, 496.86, 381.25, 633.12 ], "normalized_solution": [ 369, 776, 794, 989 ] }, { "height": 640, "width": 480, "id": 536, "original_id": 101327, "dataset_name": "refcoco", "area": 16099.130900000004, "iscrowd": 0, "image_id": 536, "category_id": 62, "bbox_list": [ [ 177.55, 496.86, 380.25, 632.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579446.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right most red chair.", "normal_caption": "right most red chair", "solution": [ 177.55, 496.86, 381.25, 633.12 ], "normalized_solution": [ 369, 776, 794, 989 ] }, { "height": 640, "width": 615, "id": 537, "original_id": 496517, "dataset_name": "refcoco", "area": 46183.673, "iscrowd": 0, "image_id": 537, "category_id": 1, "bbox_list": [ [ 292.7, 128.47, 442.2, 638.1 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579395.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl on right.", "normal_caption": "girl on right", "solution": [ 292.7, 128.47, 443.2, 639.1 ], "normalized_solution": [ 475, 200, 720, 998 ] }, { "height": 640, "width": 615, "id": 538, "original_id": 496517, "dataset_name": "refcoco", "area": 46183.673, "iscrowd": 0, "image_id": 538, "category_id": 1, "bbox_list": [ [ 292.7, 128.47, 442.2, 638.1 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579395.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right girl.", "normal_caption": "right girl", "solution": [ 292.7, 128.47, 443.2, 639.1 ], "normalized_solution": [ 475, 200, 720, 998 ] }, { "height": 640, "width": 615, "id": 539, "original_id": 496517, "dataset_name": "refcoco", "area": 46183.673, "iscrowd": 0, "image_id": 539, "category_id": 1, "bbox_list": [ [ 292.7, 128.47, 442.2, 638.1 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579395.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl right.", "normal_caption": "girl right", "solution": [ 292.7, 128.47, 443.2, 639.1 ], "normalized_solution": [ 475, 200, 720, 998 ] }, { "height": 640, "width": 615, "id": 540, "original_id": 445377, "dataset_name": "refcoco", "area": 62255.96825000002, "iscrowd": 0, "image_id": 540, "category_id": 1, "bbox_list": [ [ 124.84, 102.05, 316.13, 630.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579395.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in orange top.", "normal_caption": "girl in orange top", "solution": [ 124.84, 102.05, 317.13, 631.56 ], "normalized_solution": [ 202, 159, 515, 986 ] }, { "height": 640, "width": 615, "id": 541, "original_id": 445377, "dataset_name": "refcoco", "area": 62255.96825000002, "iscrowd": 0, "image_id": 541, "category_id": 1, "bbox_list": [ [ 124.84, 102.05, 316.13, 630.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579395.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange.", "normal_caption": "orange", "solution": [ 124.84, 102.05, 317.13, 631.56 ], "normalized_solution": [ 202, 159, 515, 986 ] }, { "height": 640, "width": 615, "id": 542, "original_id": 445377, "dataset_name": "refcoco", "area": 62255.96825000002, "iscrowd": 0, "image_id": 542, "category_id": 1, "bbox_list": [ [ 124.84, 102.05, 316.13, 630.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579395.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange shirt.", "normal_caption": "orange shirt", "solution": [ 124.84, 102.05, 317.13, 631.56 ], "normalized_solution": [ 202, 159, 515, 986 ] }, { "height": 640, "width": 480, "id": 543, "original_id": 155323, "dataset_name": "refcoco", "area": 33086.08140000001, "iscrowd": 0, "image_id": 543, "category_id": 4, "bbox_list": [ [ 253.12, 70.83, 469.28999999999996, 402.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579382.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bike right.", "normal_caption": "bike right", "solution": [ 253.12, 70.83, 470.29, 403.06 ], "normalized_solution": [ 527, 110, 979, 629 ] }, { "height": 640, "width": 480, "id": 544, "original_id": 155323, "dataset_name": "refcoco", "area": 33086.08140000001, "iscrowd": 0, "image_id": 544, "category_id": 4, "bbox_list": [ [ 253.12, 70.83, 469.28999999999996, 402.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579382.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the black motorcycle.", "normal_caption": "the black motorcycle", "solution": [ 253.12, 70.83, 470.29, 403.06 ], "normalized_solution": [ 527, 110, 979, 629 ] }, { "height": 640, "width": 480, "id": 545, "original_id": 154842, "dataset_name": "refcoco", "area": 73600.88445000004, "iscrowd": 0, "image_id": 545, "category_id": 4, "bbox_list": [ [ 35.87, 14.35, 314.7, 570.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579382.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: motorcycle in front.", "normal_caption": "motorcycle in front", "solution": [ 35.87, 14.35, 315.7, 571.12 ], "normalized_solution": [ 74, 22, 657, 892 ] }, { "height": 640, "width": 480, "id": 546, "original_id": 154842, "dataset_name": "refcoco", "area": 73600.88445000004, "iscrowd": 0, "image_id": 546, "category_id": 4, "bbox_list": [ [ 35.87, 14.35, 314.7, 570.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579382.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bike infront of you.", "normal_caption": "bike infront of you", "solution": [ 35.87, 14.35, 315.7, 571.12 ], "normalized_solution": [ 74, 22, 657, 892 ] }, { "height": 425, "width": 640, "id": 547, "original_id": 585367, "dataset_name": "refcoco", "area": 11559.576400000004, "iscrowd": 0, "image_id": 547, "category_id": 22, "bbox_list": [ [ 153.91, 151.52, 299.51, 281.72 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579366.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: elephant on left.", "normal_caption": "elephant on left", "solution": [ 153.91, 151.52, 300.51, 282.72 ], "normalized_solution": [ 240, 356, 469, 665 ] }, { "height": 425, "width": 640, "id": 548, "original_id": 585367, "dataset_name": "refcoco", "area": 11559.576400000004, "iscrowd": 0, "image_id": 548, "category_id": 22, "bbox_list": [ [ 153.91, 151.52, 299.51, 281.72 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579366.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: elephant on left.", "normal_caption": "elephant on left", "solution": [ 153.91, 151.52, 300.51, 282.72 ], "normalized_solution": [ 240, 356, 469, 665 ] }, { "height": 425, "width": 640, "id": 549, "original_id": 585367, "dataset_name": "refcoco", "area": 11559.576400000004, "iscrowd": 0, "image_id": 549, "category_id": 22, "bbox_list": [ [ 153.91, 151.52, 299.51, 281.72 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579366.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lil elephant.", "normal_caption": "lil elephant", "solution": [ 153.91, 151.52, 300.51, 282.72 ], "normalized_solution": [ 240, 356, 469, 665 ] }, { "height": 425, "width": 640, "id": 550, "original_id": 584990, "dataset_name": "refcoco", "area": 16621.4252, "iscrowd": 0, "image_id": 550, "category_id": 22, "bbox_list": [ [ 286.22, 74.85, 396.05, 282.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579366.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: large elephant center.", "normal_caption": "large elephant center", "solution": [ 286.22, 74.85, 397.05, 283.98 ], "normalized_solution": [ 447, 176, 620, 668 ] }, { "height": 425, "width": 640, "id": 551, "original_id": 584990, "dataset_name": "refcoco", "area": 16621.4252, "iscrowd": 0, "image_id": 551, "category_id": 22, "bbox_list": [ [ 286.22, 74.85, 396.05, 282.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579366.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: center e.", "normal_caption": "center e", "solution": [ 286.22, 74.85, 397.05, 283.98 ], "normalized_solution": [ 447, 176, 620, 668 ] }, { "height": 425, "width": 640, "id": 552, "original_id": 584990, "dataset_name": "refcoco", "area": 16621.4252, "iscrowd": 0, "image_id": 552, "category_id": 22, "bbox_list": [ [ 286.22, 74.85, 396.05, 282.98 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579366.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bigger elephant.", "normal_caption": "bigger elephant", "solution": [ 286.22, 74.85, 397.05, 283.98 ], "normalized_solution": [ 447, 176, 620, 668 ] }, { "height": 427, "width": 640, "id": 553, "original_id": 515214, "dataset_name": "refcoco", "area": 47992.157100000004, "iscrowd": 0, "image_id": 553, "category_id": 1, "bbox_list": [ [ 11.54, 105.31, 252.89, 421.67 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man front left.", "normal_caption": "man front left", "solution": [ 11.54, 105.31, 253.89, 422.67 ], "normalized_solution": [ 18, 246, 396, 989 ] }, { "height": 427, "width": 640, "id": 554, "original_id": 515214, "dataset_name": "refcoco", "area": 47992.157100000004, "iscrowd": 0, "image_id": 554, "category_id": 1, "bbox_list": [ [ 11.54, 105.31, 252.89, 421.67 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on the left.", "normal_caption": "man on the left", "solution": [ 11.54, 105.31, 253.89, 422.67 ], "normalized_solution": [ 18, 246, 396, 989 ] }, { "height": 427, "width": 640, "id": 555, "original_id": 515214, "dataset_name": "refcoco", "area": 47992.157100000004, "iscrowd": 0, "image_id": 555, "category_id": 1, "bbox_list": [ [ 11.54, 105.31, 252.89, 421.67 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on left.", "normal_caption": "man on left", "solution": [ 11.54, 105.31, 253.89, 422.67 ], "normalized_solution": [ 18, 246, 396, 989 ] }, { "height": 427, "width": 640, "id": 556, "original_id": 511270, "dataset_name": "refcoco", "area": 10940.3983, "iscrowd": 0, "image_id": 556, "category_id": 1, "bbox_list": [ [ 201.93, 106.59, 301.24, 301.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man red shirt in back lonely.", "normal_caption": "man red shirt in back lonely", "solution": [ 201.93, 106.59, 302.24, 302.25 ], "normalized_solution": [ 315, 249, 472, 707 ] }, { "height": 427, "width": 640, "id": 557, "original_id": 511270, "dataset_name": "refcoco", "area": 10940.3983, "iscrowd": 0, "image_id": 557, "category_id": 1, "bbox_list": [ [ 201.93, 106.59, 301.24, 301.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in the back in red.", "normal_caption": "man in the back in red", "solution": [ 201.93, 106.59, 302.24, 302.25 ], "normalized_solution": [ 315, 249, 472, 707 ] }, { "height": 427, "width": 640, "id": 558, "original_id": 511270, "dataset_name": "refcoco", "area": 10940.3983, "iscrowd": 0, "image_id": 558, "category_id": 1, "bbox_list": [ [ 201.93, 106.59, 301.24, 301.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in kitchen.", "normal_caption": "guy in kitchen", "solution": [ 201.93, 106.59, 302.24, 302.25 ], "normalized_solution": [ 315, 249, 472, 707 ] }, { "height": 427, "width": 640, "id": 559, "original_id": 439647, "dataset_name": "refcoco", "area": 16177.019700000003, "iscrowd": 0, "image_id": 559, "category_id": 1, "bbox_list": [ [ 272.86, 124.99, 441.39, 418.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in red.", "normal_caption": "woman in red", "solution": [ 272.86, 124.99, 442.39, 419.79 ], "normalized_solution": [ 426, 292, 691, 983 ] }, { "height": 427, "width": 640, "id": 560, "original_id": 439647, "dataset_name": "refcoco", "area": 16177.019700000003, "iscrowd": 0, "image_id": 560, "category_id": 1, "bbox_list": [ [ 272.86, 124.99, 441.39, 418.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in red shirt next to black shirt.", "normal_caption": "woman in red shirt next to black shirt", "solution": [ 272.86, 124.99, 442.39, 419.79 ], "normalized_solution": [ 426, 292, 691, 983 ] }, { "height": 427, "width": 640, "id": 561, "original_id": 437136, "dataset_name": "refcoco", "area": 31216.44520000001, "iscrowd": 0, "image_id": 561, "category_id": 1, "bbox_list": [ [ 387.27, 133.2, 554.87, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady in blue.", "normal_caption": "lady in blue", "solution": [ 387.27, 133.2, 555.87, 427.0 ], "normalized_solution": [ 605, 311, 868, 1000 ] }, { "height": 427, "width": 640, "id": 562, "original_id": 437136, "dataset_name": "refcoco", "area": 31216.44520000001, "iscrowd": 0, "image_id": 562, "category_id": 1, "bbox_list": [ [ 387.27, 133.2, 554.87, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person far right.", "normal_caption": "person far right", "solution": [ 387.27, 133.2, 555.87, 427.0 ], "normalized_solution": [ 605, 311, 868, 1000 ] }, { "height": 427, "width": 640, "id": 563, "original_id": 437136, "dataset_name": "refcoco", "area": 31216.44520000001, "iscrowd": 0, "image_id": 563, "category_id": 1, "bbox_list": [ [ 387.27, 133.2, 554.87, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579332.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right.", "normal_caption": "woman on right", "solution": [ 387.27, 133.2, 555.87, 427.0 ], "normalized_solution": [ 605, 311, 868, 1000 ] }, { "height": 480, "width": 640, "id": 564, "original_id": 1966298, "dataset_name": "refcoco", "area": 25058.675000000007, "iscrowd": 0, "image_id": 564, "category_id": 67, "bbox_list": [ [ 145.87, 269.89, 636.09, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cloth hanging off table at bottom of screen.", "normal_caption": "cloth hanging off table at bottom of screen", "solution": [ 145.87, 269.89, 637.09, 480.0 ], "normalized_solution": [ 227, 562, 995, 1000 ] }, { "height": 480, "width": 640, "id": 565, "original_id": 1966298, "dataset_name": "refcoco", "area": 25058.675000000007, "iscrowd": 0, "image_id": 565, "category_id": 67, "bbox_list": [ [ 145.87, 269.89, 636.09, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: tablecloth edge in the lower right corner.", "normal_caption": "tablecloth edge in the lower right corner", "solution": [ 145.87, 269.89, 637.09, 480.0 ], "normalized_solution": [ 227, 562, 995, 1000 ] }, { "height": 480, "width": 640, "id": 566, "original_id": 1966298, "dataset_name": "refcoco", "area": 25058.675000000007, "iscrowd": 0, "image_id": 566, "category_id": 67, "bbox_list": [ [ 145.87, 269.89, 636.09, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: table cloth hanging over edge.", "normal_caption": "table cloth hanging over edge", "solution": [ 145.87, 269.89, 637.09, 480.0 ], "normalized_solution": [ 227, 562, 995, 1000 ] }, { "height": 480, "width": 640, "id": 567, "original_id": 123565, "dataset_name": "refcoco", "area": 39027.66980000001, "iscrowd": 0, "image_id": 567, "category_id": 67, "bbox_list": [ [ 336.56, 231.53, 639.0, 473.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: table portion bottom right of phtot.", "normal_caption": "table portion bottom right of phtot", "solution": [ 336.56, 231.53, 640.0, 474.35 ], "normalized_solution": [ 525, 482, 1000, 988 ] }, { "height": 480, "width": 640, "id": 568, "original_id": 123565, "dataset_name": "refcoco", "area": 39027.66980000001, "iscrowd": 0, "image_id": 568, "category_id": 67, "bbox_list": [ [ 336.56, 231.53, 639.0, 473.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right most table.", "normal_caption": "right most table", "solution": [ 336.56, 231.53, 640.0, 474.35 ], "normalized_solution": [ 525, 482, 1000, 988 ] }, { "height": 480, "width": 640, "id": 569, "original_id": 1283931, "dataset_name": "refcoco", "area": 12426.324700000001, "iscrowd": 0, "image_id": 569, "category_id": 1, "bbox_list": [ [ 516.68, 136.65, 639.0, 302.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: old man blue shirt far right.", "normal_caption": "old man blue shirt far right", "solution": [ 516.68, 136.65, 640.0, 303.12 ], "normalized_solution": [ 807, 284, 1000, 631 ] }, { "height": 480, "width": 640, "id": 570, "original_id": 1283931, "dataset_name": "refcoco", "area": 12426.324700000001, "iscrowd": 0, "image_id": 570, "category_id": 1, "bbox_list": [ [ 516.68, 136.65, 639.0, 302.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on furthest right.", "normal_caption": "man on furthest right", "solution": [ 516.68, 136.65, 640.0, 303.12 ], "normalized_solution": [ 807, 284, 1000, 631 ] }, { "height": 480, "width": 640, "id": 571, "original_id": 1283931, "dataset_name": "refcoco", "area": 12426.324700000001, "iscrowd": 0, "image_id": 571, "category_id": 1, "bbox_list": [ [ 516.68, 136.65, 639.0, 302.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man far right in light colored shirt.", "normal_caption": "man far right in light colored shirt", "solution": [ 516.68, 136.65, 640.0, 303.12 ], "normalized_solution": [ 807, 284, 1000, 631 ] }, { "height": 480, "width": 640, "id": 572, "original_id": 1206873, "dataset_name": "refcoco", "area": 27879.778100000014, "iscrowd": 0, "image_id": 572, "category_id": 1, "bbox_list": [ [ 61.48, 200.63, 313.97, 438.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in checked shirt btw you were right on that last one.", "normal_caption": "man in checked shirt btw you were right on that last one", "solution": [ 61.48, 200.63, 314.97, 439.01 ], "normalized_solution": [ 96, 417, 492, 914 ] }, { "height": 480, "width": 640, "id": 573, "original_id": 1206873, "dataset_name": "refcoco", "area": 27879.778100000014, "iscrowd": 0, "image_id": 573, "category_id": 1, "bbox_list": [ [ 61.48, 200.63, 313.97, 438.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue and white gingham shirt left man.", "normal_caption": "blue and white gingham shirt left man", "solution": [ 61.48, 200.63, 314.97, 439.01 ], "normalized_solution": [ 96, 417, 492, 914 ] }, { "height": 480, "width": 640, "id": 574, "original_id": 1206873, "dataset_name": "refcoco", "area": 27879.778100000014, "iscrowd": 0, "image_id": 574, "category_id": 1, "bbox_list": [ [ 61.48, 200.63, 313.97, 438.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man close to us back to us.", "normal_caption": "man close to us back to us", "solution": [ 61.48, 200.63, 314.97, 439.01 ], "normalized_solution": [ 96, 417, 492, 914 ] }, { "height": 480, "width": 640, "id": 575, "original_id": 118586, "dataset_name": "refcoco", "area": 36422.24825000001, "iscrowd": 0, "image_id": 575, "category_id": 67, "bbox_list": [ [ 0.0, 139.5, 504.85, 350.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: main table spread on left side.", "normal_caption": "main table spread on left side", "solution": [ 0.0, 139.5, 505.85, 351.96 ], "normalized_solution": [ 0, 290, 790, 733 ] }, { "height": 480, "width": 640, "id": 576, "original_id": 118586, "dataset_name": "refcoco", "area": 36422.24825000001, "iscrowd": 0, "image_id": 576, "category_id": 67, "bbox_list": [ [ 0.0, 139.5, 504.85, 350.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: a table containing plates silver wear and cups.", "normal_caption": "a table containing plates silver wear and cups", "solution": [ 0.0, 139.5, 505.85, 351.96 ], "normalized_solution": [ 0, 290, 790, 733 ] }, { "height": 480, "width": 640, "id": 577, "original_id": 118586, "dataset_name": "refcoco", "area": 36422.24825000001, "iscrowd": 0, "image_id": 577, "category_id": 67, "bbox_list": [ [ 0.0, 139.5, 504.85, 350.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579329.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left table.", "normal_caption": "left table", "solution": [ 0.0, 139.5, 505.85, 351.96 ], "normalized_solution": [ 0, 290, 790, 733 ] }, { "height": 480, "width": 640, "id": 578, "original_id": 117084, "dataset_name": "refcoco", "area": 12611.0989, "iscrowd": 0, "image_id": 578, "category_id": 63, "bbox_list": [ [ 150.59, 213.69, 295.5, 364.5 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair facing away from the window.", "normal_caption": "chair facing away from the window", "solution": [ 150.59, 213.69, 296.5, 365.5 ], "normalized_solution": [ 235, 445, 463, 761 ] }, { "height": 480, "width": 640, "id": 579, "original_id": 117084, "dataset_name": "refcoco", "area": 12611.0989, "iscrowd": 0, "image_id": 579, "category_id": 63, "bbox_list": [ [ 150.59, 213.69, 295.5, 364.5 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair by the window.", "normal_caption": "chair by the window", "solution": [ 150.59, 213.69, 296.5, 365.5 ], "normalized_solution": [ 235, 445, 463, 761 ] }, { "height": 480, "width": 640, "id": 580, "original_id": 117084, "dataset_name": "refcoco", "area": 12611.0989, "iscrowd": 0, "image_id": 580, "category_id": 63, "bbox_list": [ [ 150.59, 213.69, 295.5, 364.5 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair in front of window.", "normal_caption": "chair in front of window", "solution": [ 150.59, 213.69, 296.5, 365.5 ], "normalized_solution": [ 235, 445, 463, 761 ] }, { "height": 480, "width": 640, "id": 581, "original_id": 107655, "dataset_name": "refcoco", "area": 11761.8387, "iscrowd": 0, "image_id": 581, "category_id": 62, "bbox_list": [ [ 156.23, 210.81, 297.07, 361.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair by window.", "normal_caption": "chair by window", "solution": [ 156.23, 210.81, 298.07, 362.93 ], "normalized_solution": [ 244, 439, 465, 756 ] }, { "height": 480, "width": 640, "id": 582, "original_id": 107655, "dataset_name": "refcoco", "area": 11761.8387, "iscrowd": 0, "image_id": 582, "category_id": 62, "bbox_list": [ [ 156.23, 210.81, 297.07, 361.93 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair in front window.", "normal_caption": "chair in front window", "solution": [ 156.23, 210.81, 298.07, 362.93 ], "normalized_solution": [ 244, 439, 465, 756 ] }, { "height": 480, "width": 640, "id": 583, "original_id": 105856, "dataset_name": "refcoco", "area": 29489.624949999998, "iscrowd": 0, "image_id": 583, "category_id": 62, "bbox_list": [ [ 342.71, 310.71, 612.16, 472.80999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair bottom right.", "normal_caption": "chair bottom right", "solution": [ 342.71, 310.71, 613.16, 473.81 ], "normalized_solution": [ 535, 647, 958, 987 ] }, { "height": 480, "width": 640, "id": 584, "original_id": 105856, "dataset_name": "refcoco", "area": 29489.624949999998, "iscrowd": 0, "image_id": 584, "category_id": 62, "bbox_list": [ [ 342.71, 310.71, 612.16, 472.80999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair bottom right.", "normal_caption": "chair bottom right", "solution": [ 342.71, 310.71, 613.16, 473.81 ], "normalized_solution": [ 535, 647, 958, 987 ] }, { "height": 480, "width": 640, "id": 585, "original_id": 105856, "dataset_name": "refcoco", "area": 29489.624949999998, "iscrowd": 0, "image_id": 585, "category_id": 62, "bbox_list": [ [ 342.71, 310.71, 612.16, 472.80999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579255.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: closest chair.", "normal_caption": "closest chair", "solution": [ 342.71, 310.71, 613.16, 473.81 ], "normalized_solution": [ 535, 647, 958, 987 ] }, { "height": 640, "width": 480, "id": 586, "original_id": 1930874, "dataset_name": "refcoco", "area": 42623.58065, "iscrowd": 0, "image_id": 586, "category_id": 62, "bbox_list": [ [ 1.66, 450.49, 261.65000000000003, 632.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579215.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front black seat.", "normal_caption": "front black seat", "solution": [ 1.66, 450.49, 262.65, 633.35 ], "normalized_solution": [ 3, 703, 547, 989 ] }, { "height": 640, "width": 480, "id": 587, "original_id": 1930874, "dataset_name": "refcoco", "area": 42623.58065, "iscrowd": 0, "image_id": 587, "category_id": 62, "bbox_list": [ [ 1.66, 450.49, 261.65000000000003, 632.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579215.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: seat foreground of picture on left.", "normal_caption": "seat foreground of picture on left", "solution": [ 1.66, 450.49, 262.65, 633.35 ], "normalized_solution": [ 3, 703, 547, 989 ] }, { "height": 640, "width": 480, "id": 588, "original_id": 1930874, "dataset_name": "refcoco", "area": 42623.58065, "iscrowd": 0, "image_id": 588, "category_id": 62, "bbox_list": [ [ 1.66, 450.49, 261.65000000000003, 632.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579215.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left black.", "normal_caption": "bottom left black", "solution": [ 1.66, 450.49, 262.65, 633.35 ], "normalized_solution": [ 3, 703, 547, 989 ] }, { "height": 640, "width": 480, "id": 589, "original_id": 100345, "dataset_name": "refcoco", "area": 58399.8298, "iscrowd": 0, "image_id": 589, "category_id": 62, "bbox_list": [ [ 293.16, 257.38, 469.71000000000004, 629.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579215.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: empty sit to the right of the guy.", "normal_caption": "empty sit to the right of the guy", "solution": [ 293.16, 257.38, 470.71, 630.37 ], "normalized_solution": [ 610, 402, 980, 984 ] }, { "height": 640, "width": 480, "id": 590, "original_id": 100345, "dataset_name": "refcoco", "area": 58399.8298, "iscrowd": 0, "image_id": 590, "category_id": 62, "bbox_list": [ [ 293.16, 257.38, 469.71000000000004, 629.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579215.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: empty seat on guys left.", "normal_caption": "empty seat on guys left", "solution": [ 293.16, 257.38, 470.71, 630.37 ], "normalized_solution": [ 610, 402, 980, 984 ] }, { "height": 640, "width": 480, "id": 591, "original_id": 100345, "dataset_name": "refcoco", "area": 58399.8298, "iscrowd": 0, "image_id": 591, "category_id": 62, "bbox_list": [ [ 293.16, 257.38, 469.71000000000004, 629.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579215.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: empty seat right.", "normal_caption": "empty seat right", "solution": [ 293.16, 257.38, 470.71, 630.37 ], "normalized_solution": [ 610, 402, 980, 984 ] }, { "height": 480, "width": 640, "id": 592, "original_id": 1463479, "dataset_name": "refcoco", "area": 27906.98795, "iscrowd": 0, "image_id": 592, "category_id": 38, "bbox_list": [ [ 293.21, 208.87, 483.53, 469.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579206.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: purple bear.", "normal_caption": "purple bear", "solution": [ 293.21, 208.87, 484.53, 470.38 ], "normalized_solution": [ 458, 435, 757, 979 ] }, { "height": 480, "width": 640, "id": 593, "original_id": 1463479, "dataset_name": "refcoco", "area": 27906.98795, "iscrowd": 0, "image_id": 593, "category_id": 38, "bbox_list": [ [ 293.21, 208.87, 483.53, 469.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579206.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bear.", "normal_caption": "bear", "solution": [ 293.21, 208.87, 484.53, 470.38 ], "normalized_solution": [ 458, 435, 757, 979 ] }, { "height": 480, "width": 640, "id": 594, "original_id": 1463479, "dataset_name": "refcoco", "area": 27906.98795, "iscrowd": 0, "image_id": 594, "category_id": 38, "bbox_list": [ [ 293.21, 208.87, 483.53, 469.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579206.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bear.", "normal_caption": "bear", "solution": [ 293.21, 208.87, 484.53, 470.38 ], "normalized_solution": [ 458, 435, 757, 979 ] }, { "height": 480, "width": 640, "id": 595, "original_id": 625622, "dataset_name": "refcoco", "area": 32336.377899999996, "iscrowd": 0, "image_id": 595, "category_id": 38, "bbox_list": [ [ 76.93, 1.08, 263.38, 324.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579206.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: striped kite on left.", "normal_caption": "striped kite on left", "solution": [ 76.93, 1.08, 264.38, 325.06 ], "normalized_solution": [ 120, 2, 413, 677 ] }, { "height": 480, "width": 640, "id": 596, "original_id": 625622, "dataset_name": "refcoco", "area": 32336.377899999996, "iscrowd": 0, "image_id": 596, "category_id": 38, "bbox_list": [ [ 76.93, 1.08, 263.38, 324.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579206.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black and white streamers.", "normal_caption": "black and white streamers", "solution": [ 76.93, 1.08, 264.38, 325.06 ], "normalized_solution": [ 120, 2, 413, 677 ] }, { "height": 480, "width": 640, "id": 597, "original_id": 625622, "dataset_name": "refcoco", "area": 32336.377899999996, "iscrowd": 0, "image_id": 597, "category_id": 38, "bbox_list": [ [ 76.93, 1.08, 263.38, 324.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579206.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left striped kite.", "normal_caption": "left striped kite", "solution": [ 76.93, 1.08, 264.38, 325.06 ], "normalized_solution": [ 120, 2, 413, 677 ] }, { "height": 510, "width": 640, "id": 598, "original_id": 114144, "dataset_name": "refcoco", "area": 27382.266349999987, "iscrowd": 0, "image_id": 598, "category_id": 63, "bbox_list": [ [ 0.0, 321.67, 212.87, 503.83000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579186.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: chair bottom left.", "normal_caption": "chair bottom left", "solution": [ 0.0, 321.67, 213.87, 504.83 ], "normalized_solution": [ 0, 630, 334, 989 ] }, { "height": 510, "width": 640, "id": 599, "original_id": 114144, "dataset_name": "refcoco", "area": 27382.266349999987, "iscrowd": 0, "image_id": 599, "category_id": 63, "bbox_list": [ [ 0.0, 321.67, 212.87, 503.83000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579186.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch on left bottom.", "normal_caption": "couch on left bottom", "solution": [ 0.0, 321.67, 213.87, 504.83 ], "normalized_solution": [ 0, 630, 334, 989 ] }, { "height": 510, "width": 640, "id": 600, "original_id": 114144, "dataset_name": "refcoco", "area": 27382.266349999987, "iscrowd": 0, "image_id": 600, "category_id": 63, "bbox_list": [ [ 0.0, 321.67, 212.87, 503.83000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579186.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch bottom left corner.", "normal_caption": "couch bottom left corner", "solution": [ 0.0, 321.67, 213.87, 504.83 ], "normalized_solution": [ 0, 630, 334, 989 ] }, { "height": 510, "width": 640, "id": 601, "original_id": 98921, "dataset_name": "refcoco", "area": 22517.034449999996, "iscrowd": 0, "image_id": 601, "category_id": 63, "bbox_list": [ [ 302.57, 224.75, 557.14, 359.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579186.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right sofa.", "normal_caption": "right sofa", "solution": [ 302.57, 224.75, 558.14, 360.79 ], "normalized_solution": [ 472, 440, 872, 707 ] }, { "height": 510, "width": 640, "id": 602, "original_id": 98921, "dataset_name": "refcoco", "area": 22517.034449999996, "iscrowd": 0, "image_id": 602, "category_id": 63, "bbox_list": [ [ 302.57, 224.75, 557.14, 359.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579186.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white couch at right.", "normal_caption": "white couch at right", "solution": [ 302.57, 224.75, 558.14, 360.79 ], "normalized_solution": [ 472, 440, 872, 707 ] }, { "height": 510, "width": 640, "id": 603, "original_id": 98921, "dataset_name": "refcoco", "area": 22517.034449999996, "iscrowd": 0, "image_id": 603, "category_id": 63, "bbox_list": [ [ 302.57, 224.75, 557.14, 359.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579186.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: full shown couch.", "normal_caption": "full shown couch", "solution": [ 302.57, 224.75, 558.14, 360.79 ], "normalized_solution": [ 472, 440, 872, 707 ] }, { "height": 512, "width": 640, "id": 604, "original_id": 1707513, "dataset_name": "refcoco", "area": 25426.830949999996, "iscrowd": 0, "image_id": 604, "category_id": 1, "bbox_list": [ [ 0.0, 72.93, 103.53, 483.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the guy all the way to the left.", "normal_caption": "the guy all the way to the left", "solution": [ 0.0, 72.93, 104.53, 484.49 ], "normalized_solution": [ 0, 142, 163, 946 ] }, { "height": 512, "width": 640, "id": 605, "original_id": 1707513, "dataset_name": "refcoco", "area": 25426.830949999996, "iscrowd": 0, "image_id": 605, "category_id": 1, "bbox_list": [ [ 0.0, 72.93, 103.53, 483.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left guy.", "normal_caption": "left guy", "solution": [ 0.0, 72.93, 104.53, 484.49 ], "normalized_solution": [ 0, 142, 163, 946 ] }, { "height": 512, "width": 640, "id": 606, "original_id": 1707513, "dataset_name": "refcoco", "area": 25426.830949999996, "iscrowd": 0, "image_id": 606, "category_id": 1, "bbox_list": [ [ 0.0, 72.93, 103.53, 483.49 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: ginger.", "normal_caption": "ginger", "solution": [ 0.0, 72.93, 104.53, 484.49 ], "normalized_solution": [ 0, 142, 163, 946 ] }, { "height": 512, "width": 640, "id": 607, "original_id": 554814, "dataset_name": "refcoco", "area": 58528.6314, "iscrowd": 0, "image_id": 607, "category_id": 1, "bbox_list": [ [ 407.32, 28.69, 627.67, 511.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: 15.", "normal_caption": "15", "solution": [ 407.32, 28.69, 628.67, 512.0 ], "normalized_solution": [ 636, 56, 982, 1000 ] }, { "height": 512, "width": 640, "id": 608, "original_id": 554814, "dataset_name": "refcoco", "area": 58528.6314, "iscrowd": 0, "image_id": 608, "category_id": 1, "bbox_list": [ [ 407.32, 28.69, 627.67, 511.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: number 15.", "normal_caption": "number 15", "solution": [ 407.32, 28.69, 628.67, 512.0 ], "normalized_solution": [ 636, 56, 982, 1000 ] }, { "height": 512, "width": 640, "id": 609, "original_id": 554814, "dataset_name": "refcoco", "area": 58528.6314, "iscrowd": 0, "image_id": 609, "category_id": 1, "bbox_list": [ [ 407.32, 28.69, 627.67, 511.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: 15.", "normal_caption": "15", "solution": [ 407.32, 28.69, 628.67, 512.0 ], "normalized_solution": [ 636, 56, 982, 1000 ] }, { "height": 512, "width": 640, "id": 610, "original_id": 456967, "dataset_name": "refcoco", "area": 25826.64785, "iscrowd": 0, "image_id": 610, "category_id": 1, "bbox_list": [ [ 311.1, 16.07, 476.56000000000006, 488.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue player on the right with arm up.", "normal_caption": "blue player on the right with arm up", "solution": [ 311.1, 16.07, 477.56, 489.04 ], "normalized_solution": [ 486, 31, 746, 955 ] }, { "height": 512, "width": 640, "id": 611, "original_id": 456967, "dataset_name": "refcoco", "area": 25826.64785, "iscrowd": 0, "image_id": 611, "category_id": 1, "bbox_list": [ [ 311.1, 16.07, 476.56000000000006, 488.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second from right with ball.", "normal_caption": "second from right with ball", "solution": [ 311.1, 16.07, 477.56, 489.04 ], "normalized_solution": [ 486, 31, 746, 955 ] }, { "height": 512, "width": 640, "id": 612, "original_id": 456967, "dataset_name": "refcoco", "area": 25826.64785, "iscrowd": 0, "image_id": 612, "category_id": 1, "bbox_list": [ [ 311.1, 16.07, 476.56000000000006, 488.04 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy kicking ball.", "normal_caption": "guy kicking ball", "solution": [ 311.1, 16.07, 477.56, 489.04 ], "normalized_solution": [ 486, 31, 746, 955 ] }, { "height": 512, "width": 640, "id": 613, "original_id": 453325, "dataset_name": "refcoco", "area": 42291.230999999985, "iscrowd": 0, "image_id": 613, "category_id": 1, "bbox_list": [ [ 39.12, 97.8, 374.08, 500.64 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white uniform left.", "normal_caption": "white uniform left", "solution": [ 39.12, 97.8, 375.08, 501.64 ], "normalized_solution": [ 61, 191, 586, 979 ] }, { "height": 512, "width": 640, "id": 614, "original_id": 453325, "dataset_name": "refcoco", "area": 42291.230999999985, "iscrowd": 0, "image_id": 614, "category_id": 1, "bbox_list": [ [ 39.12, 97.8, 374.08, 500.64 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man white shirt left.", "normal_caption": "man white shirt left", "solution": [ 39.12, 97.8, 375.08, 501.64 ], "normalized_solution": [ 61, 191, 586, 979 ] }, { "height": 512, "width": 640, "id": 615, "original_id": 453325, "dataset_name": "refcoco", "area": 42291.230999999985, "iscrowd": 0, "image_id": 615, "category_id": 1, "bbox_list": [ [ 39.12, 97.8, 374.08, 500.64 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579179.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: soccer player in white with visible face.", "normal_caption": "soccer player in white with visible face", "solution": [ 39.12, 97.8, 375.08, 501.64 ], "normalized_solution": [ 61, 191, 586, 979 ] }, { "height": 480, "width": 640, "id": 616, "original_id": 1901473, "dataset_name": "refcoco", "area": 67616.8238, "iscrowd": 0, "image_id": 616, "category_id": 51, "bbox_list": [ [ 0.0, 176.24, 301.64, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579165.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bowlspoon on the left with the white stuff in it.", "normal_caption": "bowlspoon on the left with the white stuff in it", "solution": [ 0.0, 176.24, 302.64, 480.0 ], "normalized_solution": [ 0, 367, 472, 1000 ] }, { "height": 480, "width": 640, "id": 617, "original_id": 1901473, "dataset_name": "refcoco", "area": 67616.8238, "iscrowd": 0, "image_id": 617, "category_id": 51, "bbox_list": [ [ 0.0, 176.24, 301.64, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579165.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left dish.", "normal_caption": "bottom left dish", "solution": [ 0.0, 176.24, 302.64, 480.0 ], "normalized_solution": [ 0, 367, 472, 1000 ] }, { "height": 480, "width": 640, "id": 618, "original_id": 1538645, "dataset_name": "refcoco", "area": 41361.606850000004, "iscrowd": 0, "image_id": 618, "category_id": 51, "bbox_list": [ [ 220.62, 29.05, 535.98, 213.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579165.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bowl with broccoli.", "normal_caption": "bowl with broccoli", "solution": [ 220.62, 29.05, 536.98, 214.65 ], "normalized_solution": [ 344, 60, 839, 447 ] }, { "height": 480, "width": 640, "id": 619, "original_id": 1538645, "dataset_name": "refcoco", "area": 41361.606850000004, "iscrowd": 0, "image_id": 619, "category_id": 51, "bbox_list": [ [ 220.62, 29.05, 535.98, 213.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579165.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bowl with broccli.", "normal_caption": "bowl with broccli", "solution": [ 220.62, 29.05, 536.98, 214.65 ], "normalized_solution": [ 344, 60, 839, 447 ] }, { "height": 480, "width": 640, "id": 620, "original_id": 1538645, "dataset_name": "refcoco", "area": 41361.606850000004, "iscrowd": 0, "image_id": 620, "category_id": 51, "bbox_list": [ [ 220.62, 29.05, 535.98, 213.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579165.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccoli bowl.", "normal_caption": "broccoli bowl", "solution": [ 220.62, 29.05, 536.98, 214.65 ], "normalized_solution": [ 344, 60, 839, 447 ] }, { "height": 375, "width": 500, "id": 621, "original_id": 278014, "dataset_name": "refcoco", "area": 21672.500250000012, "iscrowd": 0, "image_id": 621, "category_id": 21, "bbox_list": [ [ 42.63, 145.95, 298.38, 313.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579156.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left cow.", "normal_caption": "left cow", "solution": [ 42.63, 145.95, 299.38, 314.03 ], "normalized_solution": [ 85, 389, 598, 837 ] }, { "height": 375, "width": 500, "id": 622, "original_id": 278014, "dataset_name": "refcoco", "area": 21672.500250000012, "iscrowd": 0, "image_id": 622, "category_id": 21, "bbox_list": [ [ 42.63, 145.95, 298.38, 313.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579156.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow on left.", "normal_caption": "cow on left", "solution": [ 42.63, 145.95, 299.38, 314.03 ], "normalized_solution": [ 85, 389, 598, 837 ] }, { "height": 375, "width": 500, "id": 623, "original_id": 278014, "dataset_name": "refcoco", "area": 21672.500250000012, "iscrowd": 0, "image_id": 623, "category_id": 21, "bbox_list": [ [ 42.63, 145.95, 298.38, 313.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579156.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow on left.", "normal_caption": "cow on left", "solution": [ 42.63, 145.95, 299.38, 314.03 ], "normalized_solution": [ 85, 389, 598, 837 ] }, { "height": 375, "width": 500, "id": 624, "original_id": 71456, "dataset_name": "refcoco", "area": 14329.419500000004, "iscrowd": 0, "image_id": 624, "category_id": 21, "bbox_list": [ [ 402.42, 140.32, 499.0, 341.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579156.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cow on the far right.", "normal_caption": "cow on the far right", "solution": [ 402.42, 140.32, 500.0, 342.74 ], "normalized_solution": [ 804, 374, 1000, 913 ] }, { "height": 375, "width": 500, "id": 625, "original_id": 71456, "dataset_name": "refcoco", "area": 14329.419500000004, "iscrowd": 0, "image_id": 625, "category_id": 21, "bbox_list": [ [ 402.42, 140.32, 499.0, 341.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579156.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right most cow.", "normal_caption": "right most cow", "solution": [ 402.42, 140.32, 500.0, 342.74 ], "normalized_solution": [ 804, 374, 1000, 913 ] }, { "height": 375, "width": 500, "id": 626, "original_id": 71456, "dataset_name": "refcoco", "area": 14329.419500000004, "iscrowd": 0, "image_id": 626, "category_id": 21, "bbox_list": [ [ 402.42, 140.32, 499.0, 341.74 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579156.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right cow.", "normal_caption": "far right cow", "solution": [ 402.42, 140.32, 500.0, 342.74 ], "normalized_solution": [ 804, 374, 1000, 913 ] }, { "height": 500, "width": 333, "id": 627, "original_id": 515589, "dataset_name": "refcoco", "area": 28702.995700000003, "iscrowd": 0, "image_id": 627, "category_id": 1, "bbox_list": [ [ 4.49, 141.39, 146.19, 492.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579145.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy.", "normal_caption": "guy", "solution": [ 4.49, 141.39, 147.19, 493.07 ], "normalized_solution": [ 13, 282, 442, 986 ] }, { "height": 500, "width": 333, "id": 628, "original_id": 515589, "dataset_name": "refcoco", "area": 28702.995700000003, "iscrowd": 0, "image_id": 628, "category_id": 1, "bbox_list": [ [ 4.49, 141.39, 146.19, 492.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579145.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid on left.", "normal_caption": "kid on left", "solution": [ 4.49, 141.39, 147.19, 493.07 ], "normalized_solution": [ 13, 282, 442, 986 ] }, { "height": 500, "width": 333, "id": 629, "original_id": 515589, "dataset_name": "refcoco", "area": 28702.995700000003, "iscrowd": 0, "image_id": 629, "category_id": 1, "bbox_list": [ [ 4.49, 141.39, 146.19, 492.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579145.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: number 9.", "normal_caption": "number 9", "solution": [ 4.49, 141.39, 147.19, 493.07 ], "normalized_solution": [ 13, 282, 442, 986 ] }, { "height": 500, "width": 333, "id": 630, "original_id": 479698, "dataset_name": "refcoco", "area": 34492.97555, "iscrowd": 0, "image_id": 630, "category_id": 1, "bbox_list": [ [ 98.88, 207.87, 328.21000000000004, 491.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579145.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 98.88, 207.87, 329.21, 492.13 ], "normalized_solution": [ 296, 415, 988, 984 ] }, { "height": 500, "width": 333, "id": 631, "original_id": 479698, "dataset_name": "refcoco", "area": 34492.97555, "iscrowd": 0, "image_id": 631, "category_id": 1, "bbox_list": [ [ 98.88, 207.87, 328.21000000000004, 491.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579145.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in red shirt.", "normal_caption": "woman in red shirt", "solution": [ 98.88, 207.87, 329.21, 492.13 ], "normalized_solution": [ 296, 415, 988, 984 ] }, { "height": 500, "width": 333, "id": 632, "original_id": 479698, "dataset_name": "refcoco", "area": 34492.97555, "iscrowd": 0, "image_id": 632, "category_id": 1, "bbox_list": [ [ 98.88, 207.87, 328.21000000000004, 491.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579145.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady red.", "normal_caption": "lady red", "solution": [ 98.88, 207.87, 329.21, 492.13 ], "normalized_solution": [ 296, 415, 988, 984 ] }, { "height": 462, "width": 600, "id": 633, "original_id": 457633, "dataset_name": "refcoco", "area": 90720.44099999998, "iscrowd": 0, "image_id": 633, "category_id": 1, "bbox_list": [ [ 1.04, 1.04, 340.3, 429.78000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579138.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on left.", "normal_caption": "man on left", "solution": [ 1.04, 1.04, 341.3, 430.78 ], "normalized_solution": [ 1, 2, 568, 932 ] }, { "height": 462, "width": 600, "id": 634, "original_id": 457633, "dataset_name": "refcoco", "area": 90720.44099999998, "iscrowd": 0, "image_id": 634, "category_id": 1, "bbox_list": [ [ 1.04, 1.04, 340.3, 429.78000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579138.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on the left.", "normal_caption": "man on the left", "solution": [ 1.04, 1.04, 341.3, 430.78 ], "normalized_solution": [ 1, 2, 568, 932 ] }, { "height": 462, "width": 600, "id": 635, "original_id": 457633, "dataset_name": "refcoco", "area": 90720.44099999998, "iscrowd": 0, "image_id": 635, "category_id": 1, "bbox_list": [ [ 1.04, 1.04, 340.3, 429.78000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579138.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left man sorry.", "normal_caption": "left man sorry", "solution": [ 1.04, 1.04, 341.3, 430.78 ], "normalized_solution": [ 1, 2, 568, 932 ] }, { "height": 462, "width": 600, "id": 636, "original_id": 440025, "dataset_name": "refcoco", "area": 59938.376200000035, "iscrowd": 0, "image_id": 636, "category_id": 1, "bbox_list": [ [ 337.14, 41.62, 599.0, 454.76 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579138.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on right.", "normal_caption": "man on right", "solution": [ 337.14, 41.62, 600.0, 455.76 ], "normalized_solution": [ 561, 90, 1000, 986 ] }, { "height": 462, "width": 600, "id": 637, "original_id": 440025, "dataset_name": "refcoco", "area": 59938.376200000035, "iscrowd": 0, "image_id": 637, "category_id": 1, "bbox_list": [ [ 337.14, 41.62, 599.0, 454.76 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579138.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right guy.", "normal_caption": "right guy", "solution": [ 337.14, 41.62, 600.0, 455.76 ], "normalized_solution": [ 561, 90, 1000, 986 ] }, { "height": 480, "width": 640, "id": 638, "original_id": 519612, "dataset_name": "refcoco", "area": 14036.34455, "iscrowd": 0, "image_id": 638, "category_id": 1, "bbox_list": [ [ 386.16, 115.42, 516.75, 329.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in the back.", "normal_caption": "guy in the back", "solution": [ 386.16, 115.42, 517.75, 330.07 ], "normalized_solution": [ 603, 240, 808, 687 ] }, { "height": 480, "width": 640, "id": 639, "original_id": 519612, "dataset_name": "refcoco", "area": 14036.34455, "iscrowd": 0, "image_id": 639, "category_id": 1, "bbox_list": [ [ 386.16, 115.42, 516.75, 329.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on right.", "normal_caption": "guy on right", "solution": [ 386.16, 115.42, 517.75, 330.07 ], "normalized_solution": [ 603, 240, 808, 687 ] }, { "height": 480, "width": 640, "id": 640, "original_id": 519612, "dataset_name": "refcoco", "area": 14036.34455, "iscrowd": 0, "image_id": 640, "category_id": 1, "bbox_list": [ [ 386.16, 115.42, 516.75, 329.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right dude.", "normal_caption": "right dude", "solution": [ 386.16, 115.42, 517.75, 330.07 ], "normalized_solution": [ 603, 240, 808, 687 ] }, { "height": 480, "width": 640, "id": 641, "original_id": 497695, "dataset_name": "refcoco", "area": 19852.076350000007, "iscrowd": 0, "image_id": 641, "category_id": 1, "bbox_list": [ [ 159.28, 100.81, 304.65, 414.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman skier.", "normal_caption": "woman skier", "solution": [ 159.28, 100.81, 305.65, 415.07 ], "normalized_solution": [ 248, 210, 477, 864 ] }, { "height": 480, "width": 640, "id": 642, "original_id": 497695, "dataset_name": "refcoco", "area": 19852.076350000007, "iscrowd": 0, "image_id": 642, "category_id": 1, "bbox_list": [ [ 159.28, 100.81, 304.65, 414.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red sleeved.", "normal_caption": "red sleeved", "solution": [ 159.28, 100.81, 305.65, 415.07 ], "normalized_solution": [ 248, 210, 477, 864 ] }, { "height": 480, "width": 640, "id": 643, "original_id": 497695, "dataset_name": "refcoco", "area": 19852.076350000007, "iscrowd": 0, "image_id": 643, "category_id": 1, "bbox_list": [ [ 159.28, 100.81, 304.65, 414.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579136.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person front blue.", "normal_caption": "person front blue", "solution": [ 159.28, 100.81, 305.65, 415.07 ], "normalized_solution": [ 248, 210, 477, 864 ] }, { "height": 640, "width": 480, "id": 644, "original_id": 519688, "dataset_name": "refcoco", "area": 19347.000099999997, "iscrowd": 0, "image_id": 644, "category_id": 1, "bbox_list": [ [ 308.52, 370.22, 479.0, 630.3900000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579051.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: armhand bottom right.", "normal_caption": "armhand bottom right", "solution": [ 308.52, 370.22, 480.0, 631.39 ], "normalized_solution": [ 642, 578, 1000, 986 ] }, { "height": 640, "width": 480, "id": 645, "original_id": 519688, "dataset_name": "refcoco", "area": 19347.000099999997, "iscrowd": 0, "image_id": 645, "category_id": 1, "bbox_list": [ [ 308.52, 370.22, 479.0, 630.3900000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579051.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: big hand.", "normal_caption": "big hand", "solution": [ 308.52, 370.22, 480.0, 631.39 ], "normalized_solution": [ 642, 578, 1000, 986 ] }, { "height": 640, "width": 480, "id": 646, "original_id": 519688, "dataset_name": "refcoco", "area": 19347.000099999997, "iscrowd": 0, "image_id": 646, "category_id": 1, "bbox_list": [ [ 308.52, 370.22, 479.0, 630.3900000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579051.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: adults arm.", "normal_caption": "adults arm", "solution": [ 308.52, 370.22, 480.0, 631.39 ], "normalized_solution": [ 642, 578, 1000, 986 ] }, { "height": 640, "width": 480, "id": 647, "original_id": 511700, "dataset_name": "refcoco", "area": 35178.40745, "iscrowd": 0, "image_id": 647, "category_id": 1, "bbox_list": [ [ 288.75, 100.98, 434.61, 621.8000000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579051.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: ki.", "normal_caption": "ki", "solution": [ 288.75, 100.98, 435.61, 622.8 ], "normalized_solution": [ 601, 157, 907, 973 ] }, { "height": 640, "width": 480, "id": 648, "original_id": 511700, "dataset_name": "refcoco", "area": 35178.40745, "iscrowd": 0, "image_id": 648, "category_id": 1, "bbox_list": [ [ 288.75, 100.98, 434.61, 621.8000000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579051.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 288.75, 100.98, 435.61, 622.8 ], "normalized_solution": [ 601, 157, 907, 973 ] }, { "height": 640, "width": 480, "id": 649, "original_id": 511700, "dataset_name": "refcoco", "area": 35178.40745, "iscrowd": 0, "image_id": 649, "category_id": 1, "bbox_list": [ [ 288.75, 100.98, 434.61, 621.8000000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000579051.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: child standing.", "normal_caption": "child standing", "solution": [ 288.75, 100.98, 435.61, 622.8 ], "normalized_solution": [ 601, 157, 907, 973 ] }, { "height": 427, "width": 640, "id": 650, "original_id": 2186326, "dataset_name": "refcoco", "area": 10371.07035, "iscrowd": 0, "image_id": 650, "category_id": 52, "bbox_list": [ [ 110.34, 76.24, 229.60000000000002, 195.5 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left banana piece.", "normal_caption": "top left banana piece", "solution": [ 110.34, 76.24, 230.6, 196.5 ], "normalized_solution": [ 172, 178, 360, 460 ] }, { "height": 427, "width": 640, "id": 651, "original_id": 2186326, "dataset_name": "refcoco", "area": 10371.07035, "iscrowd": 0, "image_id": 651, "category_id": 52, "bbox_list": [ [ 110.34, 76.24, 229.60000000000002, 195.5 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: banana upper left.", "normal_caption": "banana upper left", "solution": [ 110.34, 76.24, 230.6, 196.5 ], "normalized_solution": [ 172, 178, 360, 460 ] }, { "height": 427, "width": 640, "id": 652, "original_id": 1545499, "dataset_name": "refcoco", "area": 15247.83865, "iscrowd": 0, "image_id": 652, "category_id": 52, "bbox_list": [ [ 418.52, 129.03, 589.9, 296.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: just avove.", "normal_caption": "just avove", "solution": [ 418.52, 129.03, 590.9, 297.32 ], "normalized_solution": [ 653, 302, 923, 696 ] }, { "height": 427, "width": 640, "id": 653, "original_id": 1545499, "dataset_name": "refcoco", "area": 15247.83865, "iscrowd": 0, "image_id": 653, "category_id": 52, "bbox_list": [ [ 418.52, 129.03, 589.9, 296.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: yes.", "normal_caption": "yes", "solution": [ 418.52, 129.03, 590.9, 297.32 ], "normalized_solution": [ 653, 302, 923, 696 ] }, { "height": 427, "width": 640, "id": 654, "original_id": 1544097, "dataset_name": "refcoco", "area": 18485.475950000004, "iscrowd": 0, "image_id": 654, "category_id": 52, "bbox_list": [ [ 52.78, 177.52, 539.23, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: dumpling in front on right.", "normal_caption": "dumpling in front on right", "solution": [ 52.78, 177.52, 540.23, 427.0 ], "normalized_solution": [ 82, 415, 844, 1000 ] }, { "height": 427, "width": 640, "id": 655, "original_id": 1544097, "dataset_name": "refcoco", "area": 18485.475950000004, "iscrowd": 0, "image_id": 655, "category_id": 52, "bbox_list": [ [ 52.78, 177.52, 539.23, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: banana big piece lower right.", "normal_caption": "banana big piece lower right", "solution": [ 52.78, 177.52, 540.23, 427.0 ], "normalized_solution": [ 82, 415, 844, 1000 ] }, { "height": 427, "width": 640, "id": 656, "original_id": 1544097, "dataset_name": "refcoco", "area": 18485.475950000004, "iscrowd": 0, "image_id": 656, "category_id": 52, "bbox_list": [ [ 52.78, 177.52, 539.23, 426.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578950.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front to the right yellow.", "normal_caption": "front to the right yellow", "solution": [ 52.78, 177.52, 540.23, 427.0 ], "normalized_solution": [ 82, 415, 844, 1000 ] }, { "height": 640, "width": 480, "id": 657, "original_id": 1611757, "dataset_name": "refcoco", "area": 26461.836, "iscrowd": 0, "image_id": 657, "category_id": 65, "bbox_list": [ [ 356.67, 279.01, 479.0, 636.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578924.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue right of arm.", "normal_caption": "blue right of arm", "solution": [ 356.67, 279.01, 480.0, 637.12 ], "normalized_solution": [ 743, 435, 1000, 995 ] }, { "height": 640, "width": 480, "id": 658, "original_id": 1611757, "dataset_name": "refcoco", "area": 26461.836, "iscrowd": 0, "image_id": 658, "category_id": 65, "bbox_list": [ [ 356.67, 279.01, 479.0, 636.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578924.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the blue blanket to the right of the kids arm.", "normal_caption": "the blue blanket to the right of the kids arm", "solution": [ 356.67, 279.01, 480.0, 637.12 ], "normalized_solution": [ 743, 435, 1000, 995 ] }, { "height": 640, "width": 480, "id": 659, "original_id": 1611757, "dataset_name": "refcoco", "area": 26461.836, "iscrowd": 0, "image_id": 659, "category_id": 65, "bbox_list": [ [ 356.67, 279.01, 479.0, 636.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578924.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right bottom.", "normal_caption": "far right bottom", "solution": [ 356.67, 279.01, 480.0, 637.12 ], "normalized_solution": [ 743, 435, 1000, 995 ] }, { "height": 640, "width": 480, "id": 660, "original_id": 317075, "dataset_name": "refcoco", "area": 108080.7093, "iscrowd": 0, "image_id": 660, "category_id": 65, "bbox_list": [ [ 2.88, 2.88, 479.0, 324.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578924.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: anywhee quilttop.", "normal_caption": "anywhee quilttop", "solution": [ 2.88, 2.88, 480.0, 325.03 ], "normalized_solution": [ 6, 4, 1000, 507 ] }, { "height": 640, "width": 480, "id": 661, "original_id": 317075, "dataset_name": "refcoco", "area": 108080.7093, "iscrowd": 0, "image_id": 661, "category_id": 65, "bbox_list": [ [ 2.88, 2.88, 479.0, 324.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578924.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blanket in top part of pic.", "normal_caption": "blanket in top part of pic", "solution": [ 2.88, 2.88, 480.0, 325.03 ], "normalized_solution": [ 6, 4, 1000, 507 ] }, { "height": 640, "width": 480, "id": 662, "original_id": 317075, "dataset_name": "refcoco", "area": 108080.7093, "iscrowd": 0, "image_id": 662, "category_id": 65, "bbox_list": [ [ 2.88, 2.88, 479.0, 324.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578924.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: quilt.", "normal_caption": "quilt", "solution": [ 2.88, 2.88, 480.0, 325.03 ], "normalized_solution": [ 6, 4, 1000, 507 ] }, { "height": 640, "width": 463, "id": 663, "original_id": 167200, "dataset_name": "refcoco", "area": 44333.06844999999, "iscrowd": 0, "image_id": 663, "category_id": 6, "bbox_list": [ [ 322.16, 172.58, 462.0, 608.8000000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578884.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: vehicle with 19 on it.", "normal_caption": "vehicle with 19 on it", "solution": [ 322.16, 172.58, 463.0, 609.8 ], "normalized_solution": [ 695, 269, 1000, 952 ] }, { "height": 640, "width": 463, "id": 664, "original_id": 167200, "dataset_name": "refcoco", "area": 44333.06844999999, "iscrowd": 0, "image_id": 664, "category_id": 6, "bbox_list": [ [ 322.16, 172.58, 462.0, 608.8000000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578884.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: 19 blue.", "normal_caption": "19 blue", "solution": [ 322.16, 172.58, 463.0, 609.8 ], "normalized_solution": [ 695, 269, 1000, 952 ] }, { "height": 640, "width": 463, "id": 665, "original_id": 167200, "dataset_name": "refcoco", "area": 44333.06844999999, "iscrowd": 0, "image_id": 665, "category_id": 6, "bbox_list": [ [ 322.16, 172.58, 462.0, 608.8000000000001 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578884.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: 19.", "normal_caption": "19", "solution": [ 322.16, 172.58, 463.0, 609.8 ], "normalized_solution": [ 695, 269, 1000, 952 ] }, { "height": 640, "width": 463, "id": 666, "original_id": 165007, "dataset_name": "refcoco", "area": 14111.340500000002, "iscrowd": 0, "image_id": 666, "category_id": 6, "bbox_list": [ [ 116.1, 251.04, 246.04, 444.54999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578884.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: read doubledecker bus.", "normal_caption": "read doubledecker bus", "solution": [ 116.1, 251.04, 247.04, 445.55 ], "normalized_solution": [ 250, 392, 533, 696 ] }, { "height": 640, "width": 463, "id": 667, "original_id": 165007, "dataset_name": "refcoco", "area": 14111.340500000002, "iscrowd": 0, "image_id": 667, "category_id": 6, "bbox_list": [ [ 116.1, 251.04, 246.04, 444.54999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578884.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red bus.", "normal_caption": "red bus", "solution": [ 116.1, 251.04, 247.04, 445.55 ], "normalized_solution": [ 250, 392, 533, 696 ] }, { "height": 640, "width": 463, "id": 668, "original_id": 165007, "dataset_name": "refcoco", "area": 14111.340500000002, "iscrowd": 0, "image_id": 668, "category_id": 6, "bbox_list": [ [ 116.1, 251.04, 246.04, 444.54999999999995 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578884.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: back left red bus.", "normal_caption": "back left red bus", "solution": [ 116.1, 251.04, 247.04, 445.55 ], "normalized_solution": [ 250, 392, 533, 696 ] }, { "height": 480, "width": 251, "id": 669, "original_id": 597165, "dataset_name": "refcoco", "area": 10808.198950000004, "iscrowd": 0, "image_id": 669, "category_id": 25, "bbox_list": [ [ 56.65, 9.9, 169.28, 255.58999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578875.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the giraffe that is holding on.", "normal_caption": "the giraffe that is holding on", "solution": [ 56.65, 9.9, 170.28, 256.59 ], "normalized_solution": [ 225, 20, 678, 534 ] }, { "height": 480, "width": 251, "id": 670, "original_id": 597165, "dataset_name": "refcoco", "area": 10808.198950000004, "iscrowd": 0, "image_id": 670, "category_id": 25, "bbox_list": [ [ 56.65, 9.9, 169.28, 255.58999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578875.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top giraffe lol.", "normal_caption": "top giraffe lol", "solution": [ 56.65, 9.9, 170.28, 256.59 ], "normalized_solution": [ 225, 20, 678, 534 ] }, { "height": 480, "width": 251, "id": 671, "original_id": 597165, "dataset_name": "refcoco", "area": 10808.198950000004, "iscrowd": 0, "image_id": 671, "category_id": 25, "bbox_list": [ [ 56.65, 9.9, 169.28, 255.58999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578875.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girraffe riding.", "normal_caption": "girraffe riding", "solution": [ 56.65, 9.9, 170.28, 256.59 ], "normalized_solution": [ 225, 20, 678, 534 ] }, { "height": 480, "width": 251, "id": 672, "original_id": 596775, "dataset_name": "refcoco", "area": 25313.623749999995, "iscrowd": 0, "image_id": 672, "category_id": 25, "bbox_list": [ [ 3.83, 61.75, 244.05, 460.82 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578875.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: momma giraffe.", "normal_caption": "momma giraffe", "solution": [ 3.83, 61.75, 245.05, 461.82 ], "normalized_solution": [ 15, 128, 976, 962 ] }, { "height": 480, "width": 251, "id": 673, "original_id": 596775, "dataset_name": "refcoco", "area": 25313.623749999995, "iscrowd": 0, "image_id": 673, "category_id": 25, "bbox_list": [ [ 3.83, 61.75, 244.05, 460.82 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578875.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: frt.", "normal_caption": "frt", "solution": [ 3.83, 61.75, 245.05, 461.82 ], "normalized_solution": [ 15, 128, 976, 962 ] }, { "height": 480, "width": 251, "id": 674, "original_id": 596775, "dataset_name": "refcoco", "area": 25313.623749999995, "iscrowd": 0, "image_id": 674, "category_id": 25, "bbox_list": [ [ 3.83, 61.75, 244.05, 460.82 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578875.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom giraffe.", "normal_caption": "bottom giraffe", "solution": [ 3.83, 61.75, 245.05, 461.82 ], "normalized_solution": [ 15, 128, 976, 962 ] }, { "height": 427, "width": 640, "id": 675, "original_id": 544253, "dataset_name": "refcoco", "area": 10068.628700000005, "iscrowd": 0, "image_id": 675, "category_id": 1, "bbox_list": [ [ 382.86, 171.76, 439.12, 418.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578841.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl with pink hat and white gloves.", "normal_caption": "girl with pink hat and white gloves", "solution": [ 382.86, 171.76, 440.12, 419.32 ], "normalized_solution": [ 598, 402, 687, 982 ] }, { "height": 427, "width": 640, "id": 676, "original_id": 544253, "dataset_name": "refcoco", "area": 10068.628700000005, "iscrowd": 0, "image_id": 676, "category_id": 1, "bbox_list": [ [ 382.86, 171.76, 439.12, 418.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578841.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid in blue.", "normal_caption": "kid in blue", "solution": [ 382.86, 171.76, 440.12, 419.32 ], "normalized_solution": [ 598, 402, 687, 982 ] }, { "height": 427, "width": 640, "id": 677, "original_id": 493487, "dataset_name": "refcoco", "area": 18564.354699999993, "iscrowd": 0, "image_id": 677, "category_id": 1, "bbox_list": [ [ 190.95, 95.96, 280.15, 419.28 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578841.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in baby blue.", "normal_caption": "woman in baby blue", "solution": [ 190.95, 95.96, 281.15, 420.28 ], "normalized_solution": [ 298, 224, 439, 984 ] }, { "height": 427, "width": 640, "id": 678, "original_id": 493487, "dataset_name": "refcoco", "area": 18564.354699999993, "iscrowd": 0, "image_id": 678, "category_id": 1, "bbox_list": [ [ 190.95, 95.96, 280.15, 419.28 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578841.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman left.", "normal_caption": "woman left", "solution": [ 190.95, 95.96, 281.15, 420.28 ], "normalized_solution": [ 298, 224, 439, 984 ] }, { "height": 427, "width": 640, "id": 679, "original_id": 493487, "dataset_name": "refcoco", "area": 18564.354699999993, "iscrowd": 0, "image_id": 679, "category_id": 1, "bbox_list": [ [ 190.95, 95.96, 280.15, 419.28 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578841.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on left.", "normal_caption": "person on left", "solution": [ 190.95, 95.96, 281.15, 420.28 ], "normalized_solution": [ 298, 224, 439, 984 ] }, { "height": 640, "width": 595, "id": 680, "original_id": 2158908, "dataset_name": "refcoco", "area": 15567.20665, "iscrowd": 0, "image_id": 680, "category_id": 1, "bbox_list": [ [ 438.8, 1.99, 541.1700000000001, 273.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: catcher in background right.", "normal_caption": "catcher in background right", "solution": [ 438.8, 1.99, 542.17, 274.2 ], "normalized_solution": [ 737, 3, 911, 428 ] }, { "height": 640, "width": 595, "id": 681, "original_id": 2158908, "dataset_name": "refcoco", "area": 15567.20665, "iscrowd": 0, "image_id": 681, "category_id": 1, "bbox_list": [ [ 438.8, 1.99, 541.1700000000001, 273.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy top right of kid.", "normal_caption": "guy top right of kid", "solution": [ 438.8, 1.99, 542.17, 274.2 ], "normalized_solution": [ 737, 3, 911, 428 ] }, { "height": 640, "width": 595, "id": 682, "original_id": 2158908, "dataset_name": "refcoco", "area": 15567.20665, "iscrowd": 0, "image_id": 682, "category_id": 1, "bbox_list": [ [ 438.8, 1.99, 541.1700000000001, 273.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy with glove top right behind kids right shoulder.", "normal_caption": "guy with glove top right behind kids right shoulder", "solution": [ 438.8, 1.99, 542.17, 274.2 ], "normalized_solution": [ 737, 3, 911, 428 ] }, { "height": 640, "width": 595, "id": 683, "original_id": 2002580, "dataset_name": "refcoco", "area": 13564.05295, "iscrowd": 0, "image_id": 683, "category_id": 1, "bbox_list": [ [ 226.08, 0.0, 344.77, 316.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: referee.", "normal_caption": "referee", "solution": [ 226.08, 0.0, 345.77, 317.51 ], "normalized_solution": [ 379, 0, 581, 496 ] }, { "height": 640, "width": 595, "id": 684, "original_id": 2002580, "dataset_name": "refcoco", "area": 13564.05295, "iscrowd": 0, "image_id": 684, "category_id": 1, "bbox_list": [ [ 226.08, 0.0, 344.77, 316.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: umpire.", "normal_caption": "umpire", "solution": [ 226.08, 0.0, 345.77, 317.51 ], "normalized_solution": [ 379, 0, 581, 496 ] }, { "height": 640, "width": 595, "id": 685, "original_id": 2002580, "dataset_name": "refcoco", "area": 13564.05295, "iscrowd": 0, "image_id": 685, "category_id": 1, "bbox_list": [ [ 226.08, 0.0, 344.77, 316.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in background gray shirt.", "normal_caption": "guy in background gray shirt", "solution": [ 226.08, 0.0, 345.77, 317.51 ], "normalized_solution": [ 379, 0, 581, 496 ] }, { "height": 640, "width": 595, "id": 686, "original_id": 445162, "dataset_name": "refcoco", "area": 71667.0893, "iscrowd": 0, "image_id": 686, "category_id": 1, "bbox_list": [ [ 223.86, 40.35, 502.68, 607.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid.", "normal_caption": "kid", "solution": [ 223.86, 40.35, 503.68, 608.6 ], "normalized_solution": [ 376, 63, 846, 950 ] }, { "height": 640, "width": 595, "id": 687, "original_id": 445162, "dataset_name": "refcoco", "area": 71667.0893, "iscrowd": 0, "image_id": 687, "category_id": 1, "bbox_list": [ [ 223.86, 40.35, 502.68, 607.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the boy in blue.", "normal_caption": "the boy in blue", "solution": [ 223.86, 40.35, 503.68, 608.6 ], "normalized_solution": [ 376, 63, 846, 950 ] }, { "height": 640, "width": 595, "id": 688, "original_id": 445162, "dataset_name": "refcoco", "area": 71667.0893, "iscrowd": 0, "image_id": 688, "category_id": 1, "bbox_list": [ [ 223.86, 40.35, 502.68, 607.6 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578766.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: child with the bat.", "normal_caption": "child with the bat", "solution": [ 223.86, 40.35, 503.68, 608.6 ], "normalized_solution": [ 376, 63, 846, 950 ] }, { "height": 640, "width": 512, "id": 689, "original_id": 1734399, "dataset_name": "refcoco", "area": 12578.570800000005, "iscrowd": 0, "image_id": 689, "category_id": 1, "bbox_list": [ [ 390.59, 278.83, 511.0, 487.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand just above the womens hand on right.", "normal_caption": "hand just above the womens hand on right", "solution": [ 390.59, 278.83, 512.0, 488.39 ], "normalized_solution": [ 762, 435, 1000, 763 ] }, { "height": 640, "width": 512, "id": 690, "original_id": 1734399, "dataset_name": "refcoco", "area": 12578.570800000005, "iscrowd": 0, "image_id": 690, "category_id": 1, "bbox_list": [ [ 390.59, 278.83, 511.0, 487.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right top hands.", "normal_caption": "right top hands", "solution": [ 390.59, 278.83, 512.0, 488.39 ], "normalized_solution": [ 762, 435, 1000, 763 ] }, { "height": 640, "width": 512, "id": 691, "original_id": 494900, "dataset_name": "refcoco", "area": 57008.34555, "iscrowd": 0, "image_id": 691, "category_id": 1, "bbox_list": [ [ 132.79, 301.64, 436.6, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink shirt.", "normal_caption": "pink shirt", "solution": [ 132.79, 301.64, 437.6, 640.0 ], "normalized_solution": [ 259, 471, 854, 1000 ] }, { "height": 640, "width": 512, "id": 692, "original_id": 494900, "dataset_name": "refcoco", "area": 57008.34555, "iscrowd": 0, "image_id": 692, "category_id": 1, "bbox_list": [ [ 132.79, 301.64, 436.6, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink shirt.", "normal_caption": "pink shirt", "solution": [ 132.79, 301.64, 437.6, 640.0 ], "normalized_solution": [ 259, 471, 854, 1000 ] }, { "height": 640, "width": 512, "id": 693, "original_id": 493289, "dataset_name": "refcoco", "area": 27292.988900000008, "iscrowd": 0, "image_id": 693, "category_id": 1, "bbox_list": [ [ 264.63, 316.5, 508.12, 631.9 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: first arm closest to us.", "normal_caption": "first arm closest to us", "solution": [ 264.63, 316.5, 509.12, 632.9 ], "normalized_solution": [ 516, 494, 994, 988 ] }, { "height": 640, "width": 512, "id": 694, "original_id": 493289, "dataset_name": "refcoco", "area": 27292.988900000008, "iscrowd": 0, "image_id": 694, "category_id": 1, "bbox_list": [ [ 264.63, 316.5, 508.12, 631.9 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand in front.", "normal_caption": "hand in front", "solution": [ 264.63, 316.5, 509.12, 632.9 ], "normalized_solution": [ 516, 494, 994, 988 ] }, { "height": 640, "width": 512, "id": 695, "original_id": 493289, "dataset_name": "refcoco", "area": 27292.988900000008, "iscrowd": 0, "image_id": 695, "category_id": 1, "bbox_list": [ [ 264.63, 316.5, 508.12, 631.9 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front arm covering woman in pink.", "normal_caption": "front arm covering woman in pink", "solution": [ 264.63, 316.5, 509.12, 632.9 ], "normalized_solution": [ 516, 494, 994, 988 ] }, { "height": 640, "width": 512, "id": 696, "original_id": 480123, "dataset_name": "refcoco", "area": 27502.088949999998, "iscrowd": 0, "image_id": 696, "category_id": 1, "bbox_list": [ [ 76.16, 233.04, 303.32, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on the left wearing plaid shirt.", "normal_caption": "person on the left wearing plaid shirt", "solution": [ 76.16, 233.04, 304.32, 640.0 ], "normalized_solution": [ 148, 364, 594, 1000 ] }, { "height": 640, "width": 512, "id": 697, "original_id": 480123, "dataset_name": "refcoco", "area": 27502.088949999998, "iscrowd": 0, "image_id": 697, "category_id": 1, "bbox_list": [ [ 76.16, 233.04, 303.32, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person behind pink.", "normal_caption": "person behind pink", "solution": [ 76.16, 233.04, 304.32, 640.0 ], "normalized_solution": [ 148, 364, 594, 1000 ] }, { "height": 640, "width": 512, "id": 698, "original_id": 480123, "dataset_name": "refcoco", "area": 27502.088949999998, "iscrowd": 0, "image_id": 698, "category_id": 1, "bbox_list": [ [ 76.16, 233.04, 303.32, 639.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578718.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the person in the plaid shirt kind of blocked by the lady in pink.", "normal_caption": "the person in the plaid shirt kind of blocked by the lady in pink", "solution": [ 76.16, 233.04, 304.32, 640.0 ], "normalized_solution": [ 148, 364, 594, 1000 ] }, { "height": 640, "width": 478, "id": 699, "original_id": 1560572, "dataset_name": "refcoco", "area": 19476.45845, "iscrowd": 0, "image_id": 699, "category_id": 56, "bbox_list": [ [ 64.93, 460.14, 244.01000000000002, 623.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578702.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: piece of broccoli nearest to you.", "normal_caption": "piece of broccoli nearest to you", "solution": [ 64.93, 460.14, 245.01, 624.11 ], "normalized_solution": [ 135, 718, 512, 975 ] }, { "height": 640, "width": 478, "id": 700, "original_id": 1560572, "dataset_name": "refcoco", "area": 19476.45845, "iscrowd": 0, "image_id": 700, "category_id": 56, "bbox_list": [ [ 64.93, 460.14, 244.01000000000002, 623.11 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578702.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left piece of broccoli.", "normal_caption": "bottom left piece of broccoli", "solution": [ 64.93, 460.14, 245.01, 624.11 ], "normalized_solution": [ 135, 718, 512, 975 ] }, { "height": 640, "width": 478, "id": 701, "original_id": 1058309, "dataset_name": "refcoco", "area": 20779.098349999997, "iscrowd": 0, "image_id": 701, "category_id": 56, "bbox_list": [ [ 121.98, 296.66, 309.21, 453.78000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578702.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccolli stir fry.", "normal_caption": "broccolli stir fry", "solution": [ 121.98, 296.66, 310.21, 454.78 ], "normalized_solution": [ 255, 463, 648, 710 ] }, { "height": 640, "width": 478, "id": 702, "original_id": 1058309, "dataset_name": "refcoco", "area": 20779.098349999997, "iscrowd": 0, "image_id": 702, "category_id": 56, "bbox_list": [ [ 121.98, 296.66, 309.21, 453.78000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578702.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccoli dead center.", "normal_caption": "broccoli dead center", "solution": [ 121.98, 296.66, 310.21, 454.78 ], "normalized_solution": [ 255, 463, 648, 710 ] }, { "height": 640, "width": 478, "id": 703, "original_id": 1058309, "dataset_name": "refcoco", "area": 20779.098349999997, "iscrowd": 0, "image_id": 703, "category_id": 56, "bbox_list": [ [ 121.98, 296.66, 309.21, 453.78000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578702.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broc center of pic.", "normal_caption": "broc center of pic", "solution": [ 121.98, 296.66, 310.21, 454.78 ], "normalized_solution": [ 255, 463, 648, 710 ] }, { "height": 480, "width": 640, "id": 704, "original_id": 1543878, "dataset_name": "refcoco", "area": 24466.1852, "iscrowd": 0, "image_id": 704, "category_id": 52, "bbox_list": [ [ 195.16, 18.46, 412.25, 171.36 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578652.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle cluster of bananas at the top.", "normal_caption": "middle cluster of bananas at the top", "solution": [ 195.16, 18.46, 413.25, 172.36 ], "normalized_solution": [ 304, 38, 645, 359 ] }, { "height": 480, "width": 640, "id": 705, "original_id": 1543878, "dataset_name": "refcoco", "area": 24466.1852, "iscrowd": 0, "image_id": 705, "category_id": 52, "bbox_list": [ [ 195.16, 18.46, 412.25, 171.36 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578652.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top.", "normal_caption": "top", "solution": [ 195.16, 18.46, 413.25, 172.36 ], "normalized_solution": [ 304, 38, 645, 359 ] }, { "height": 480, "width": 640, "id": 706, "original_id": 1543878, "dataset_name": "refcoco", "area": 24466.1852, "iscrowd": 0, "image_id": 706, "category_id": 52, "bbox_list": [ [ 195.16, 18.46, 412.25, 171.36 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578652.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top small bunch of bananas.", "normal_caption": "top small bunch of bananas", "solution": [ 195.16, 18.46, 413.25, 172.36 ], "normalized_solution": [ 304, 38, 645, 359 ] }, { "height": 640, "width": 640, "id": 707, "original_id": 64665, "dataset_name": "refcoco", "area": 17609.23925, "iscrowd": 0, "image_id": 707, "category_id": 20, "bbox_list": [ [ 124.14, 370.34, 350.72, 500.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578649.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: little sheep in the front.", "normal_caption": "little sheep in the front", "solution": [ 124.14, 370.34, 351.72, 501.38 ], "normalized_solution": [ 193, 578, 549, 783 ] }, { "height": 640, "width": 640, "id": 708, "original_id": 64665, "dataset_name": "refcoco", "area": 17609.23925, "iscrowd": 0, "image_id": 708, "category_id": 20, "bbox_list": [ [ 124.14, 370.34, 350.72, 500.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578649.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom sheep below other.", "normal_caption": "bottom sheep below other", "solution": [ 124.14, 370.34, 351.72, 501.38 ], "normalized_solution": [ 193, 578, 549, 783 ] }, { "height": 640, "width": 640, "id": 709, "original_id": 64665, "dataset_name": "refcoco", "area": 17609.23925, "iscrowd": 0, "image_id": 709, "category_id": 20, "bbox_list": [ [ 124.14, 370.34, 350.72, 500.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578649.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom lamb.", "normal_caption": "bottom lamb", "solution": [ 124.14, 370.34, 351.72, 501.38 ], "normalized_solution": [ 193, 578, 549, 783 ] }, { "height": 640, "width": 480, "id": 710, "original_id": 1189616, "dataset_name": "refcoco", "area": 25733.184150000005, "iscrowd": 0, "image_id": 710, "category_id": 1, "bbox_list": [ [ 287.64, 435.78, 479.0, 626.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578626.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: partial person bottom right.", "normal_caption": "partial person bottom right", "solution": [ 287.64, 435.78, 480.0, 627.06 ], "normalized_solution": [ 599, 680, 1000, 979 ] }, { "height": 640, "width": 480, "id": 711, "original_id": 1189616, "dataset_name": "refcoco", "area": 25733.184150000005, "iscrowd": 0, "image_id": 711, "category_id": 1, "bbox_list": [ [ 287.64, 435.78, 479.0, 626.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578626.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: crouching girl front.", "normal_caption": "crouching girl front", "solution": [ 287.64, 435.78, 480.0, 627.06 ], "normalized_solution": [ 599, 680, 1000, 979 ] }, { "height": 640, "width": 480, "id": 712, "original_id": 1189616, "dataset_name": "refcoco", "area": 25733.184150000005, "iscrowd": 0, "image_id": 712, "category_id": 1, "bbox_list": [ [ 287.64, 435.78, 479.0, 626.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578626.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman laying on right.", "normal_caption": "woman laying on right", "solution": [ 287.64, 435.78, 480.0, 627.06 ], "normalized_solution": [ 599, 680, 1000, 979 ] }, { "height": 640, "width": 480, "id": 713, "original_id": 425833, "dataset_name": "refcoco", "area": 16343.787800000004, "iscrowd": 0, "image_id": 713, "category_id": 1, "bbox_list": [ [ 348.04, 313.53, 476.48, 512.4399999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578626.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: womans head.", "normal_caption": "womans head", "solution": [ 348.04, 313.53, 477.48, 513.44 ], "normalized_solution": [ 725, 489, 994, 802 ] }, { "height": 640, "width": 480, "id": 714, "original_id": 425833, "dataset_name": "refcoco", "area": 16343.787800000004, "iscrowd": 0, "image_id": 714, "category_id": 1, "bbox_list": [ [ 348.04, 313.53, 476.48, 512.4399999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578626.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girls head sitting up.", "normal_caption": "girls head sitting up", "solution": [ 348.04, 313.53, 477.48, 513.44 ], "normalized_solution": [ 725, 489, 994, 802 ] }, { "height": 640, "width": 480, "id": 715, "original_id": 425833, "dataset_name": "refcoco", "area": 16343.787800000004, "iscrowd": 0, "image_id": 715, "category_id": 1, "bbox_list": [ [ 348.04, 313.53, 476.48, 512.4399999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578626.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right top person.", "normal_caption": "right top person", "solution": [ 348.04, 313.53, 477.48, 513.44 ], "normalized_solution": [ 725, 489, 994, 802 ] }, { "height": 640, "width": 640, "id": 716, "original_id": 507371, "dataset_name": "refcoco", "area": 17166.3507, "iscrowd": 0, "image_id": 716, "category_id": 1, "bbox_list": [ [ 484.32, 238.56, 602.96, 509.99 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578567.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white uniform.", "normal_caption": "white uniform", "solution": [ 484.32, 238.56, 603.96, 510.99 ], "normalized_solution": [ 756, 372, 943, 798 ] }, { "height": 640, "width": 640, "id": 717, "original_id": 507371, "dataset_name": "refcoco", "area": 17166.3507, "iscrowd": 0, "image_id": 717, "category_id": 1, "bbox_list": [ [ 484.32, 238.56, 602.96, 509.99 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578567.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player on right.", "normal_caption": "player on right", "solution": [ 484.32, 238.56, 603.96, 510.99 ], "normalized_solution": [ 756, 372, 943, 798 ] }, { "height": 640, "width": 640, "id": 718, "original_id": 507371, "dataset_name": "refcoco", "area": 17166.3507, "iscrowd": 0, "image_id": 718, "category_id": 1, "bbox_list": [ [ 484.32, 238.56, 602.96, 509.99 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578567.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: player in white.", "normal_caption": "player in white", "solution": [ 484.32, 238.56, 603.96, 510.99 ], "normalized_solution": [ 756, 372, 943, 798 ] }, { "height": 640, "width": 640, "id": 719, "original_id": 425230, "dataset_name": "refcoco", "area": 41084.139650000005, "iscrowd": 0, "image_id": 719, "category_id": 1, "bbox_list": [ [ 96.14, 172.13, 283.13, 624.5799999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578567.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pitcher.", "normal_caption": "pitcher", "solution": [ 96.14, 172.13, 284.13, 625.58 ], "normalized_solution": [ 150, 268, 443, 977 ] }, { "height": 640, "width": 640, "id": 720, "original_id": 425230, "dataset_name": "refcoco", "area": 41084.139650000005, "iscrowd": 0, "image_id": 720, "category_id": 1, "bbox_list": [ [ 96.14, 172.13, 283.13, 624.5799999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578567.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pitcher.", "normal_caption": "pitcher", "solution": [ 96.14, 172.13, 284.13, 625.58 ], "normalized_solution": [ 150, 268, 443, 977 ] }, { "height": 640, "width": 640, "id": 721, "original_id": 425230, "dataset_name": "refcoco", "area": 41084.139650000005, "iscrowd": 0, "image_id": 721, "category_id": 1, "bbox_list": [ [ 96.14, 172.13, 283.13, 624.5799999999999 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578567.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid in blue.", "normal_caption": "kid in blue", "solution": [ 96.14, 172.13, 284.13, 625.58 ], "normalized_solution": [ 150, 268, 443, 977 ] }, { "height": 480, "width": 640, "id": 722, "original_id": 558691, "dataset_name": "refcoco", "area": 33124.37965, "iscrowd": 0, "image_id": 722, "category_id": 1, "bbox_list": [ [ 435.87, 10.33, 639.0, 245.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: old dude chillin.", "normal_caption": "old dude chillin", "solution": [ 435.87, 10.33, 640.0, 246.03 ], "normalized_solution": [ 681, 21, 1000, 512 ] }, { "height": 480, "width": 640, "id": 723, "original_id": 558691, "dataset_name": "refcoco", "area": 33124.37965, "iscrowd": 0, "image_id": 723, "category_id": 1, "bbox_list": [ [ 435.87, 10.33, 639.0, 245.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the guy with glasses.", "normal_caption": "the guy with glasses", "solution": [ 435.87, 10.33, 640.0, 246.03 ], "normalized_solution": [ 681, 21, 1000, 512 ] }, { "height": 480, "width": 640, "id": 724, "original_id": 558691, "dataset_name": "refcoco", "area": 33124.37965, "iscrowd": 0, "image_id": 724, "category_id": 1, "bbox_list": [ [ 435.87, 10.33, 639.0, 245.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy right.", "normal_caption": "guy right", "solution": [ 435.87, 10.33, 640.0, 246.03 ], "normalized_solution": [ 681, 21, 1000, 512 ] }, { "height": 480, "width": 640, "id": 725, "original_id": 443430, "dataset_name": "refcoco", "area": 65392.12195000001, "iscrowd": 0, "image_id": 725, "category_id": 1, "bbox_list": [ [ 56.09, 24.81, 308.57, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue.", "normal_caption": "blue", "solution": [ 56.09, 24.81, 309.57, 480.0 ], "normalized_solution": [ 87, 51, 483, 1000 ] }, { "height": 480, "width": 640, "id": 726, "original_id": 443430, "dataset_name": "refcoco", "area": 65392.12195000001, "iscrowd": 0, "image_id": 726, "category_id": 1, "bbox_list": [ [ 56.09, 24.81, 308.57, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue shrt.", "normal_caption": "blue shrt", "solution": [ 56.09, 24.81, 309.57, 480.0 ], "normalized_solution": [ 87, 51, 483, 1000 ] }, { "height": 480, "width": 640, "id": 727, "original_id": 443430, "dataset_name": "refcoco", "area": 65392.12195000001, "iscrowd": 0, "image_id": 727, "category_id": 1, "bbox_list": [ [ 56.09, 24.81, 308.57, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578523.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady.", "normal_caption": "lady", "solution": [ 56.09, 24.81, 309.57, 480.0 ], "normalized_solution": [ 87, 51, 483, 1000 ] }, { "height": 480, "width": 640, "id": 728, "original_id": 525163, "dataset_name": "refcoco", "area": 65255.980899999995, "iscrowd": 0, "image_id": 728, "category_id": 1, "bbox_list": [ [ 1.08, 4.13, 280.53, 474.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578521.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on left black jacket half in frame.", "normal_caption": "guy on left black jacket half in frame", "solution": [ 1.08, 4.13, 281.53, 475.51 ], "normalized_solution": [ 1, 8, 439, 990 ] }, { "height": 480, "width": 640, "id": 729, "original_id": 525163, "dataset_name": "refcoco", "area": 65255.980899999995, "iscrowd": 0, "image_id": 729, "category_id": 1, "bbox_list": [ [ 1.08, 4.13, 280.53, 474.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578521.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man with back to us in front.", "normal_caption": "man with back to us in front", "solution": [ 1.08, 4.13, 281.53, 475.51 ], "normalized_solution": [ 1, 8, 439, 990 ] }, { "height": 480, "width": 640, "id": 730, "original_id": 525163, "dataset_name": "refcoco", "area": 65255.980899999995, "iscrowd": 0, "image_id": 730, "category_id": 1, "bbox_list": [ [ 1.08, 4.13, 280.53, 474.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578521.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on left back to pic.", "normal_caption": "man on left back to pic", "solution": [ 1.08, 4.13, 281.53, 475.51 ], "normalized_solution": [ 1, 8, 439, 990 ] }, { "height": 480, "width": 640, "id": 731, "original_id": 524828, "dataset_name": "refcoco", "area": 29765.643799999998, "iscrowd": 0, "image_id": 731, "category_id": 1, "bbox_list": [ [ 225.59, 52.48, 407.48, 384.53000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578521.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man at center.", "normal_caption": "man at center", "solution": [ 225.59, 52.48, 408.48, 385.53 ], "normalized_solution": [ 352, 109, 638, 803 ] }, { "height": 480, "width": 640, "id": 732, "original_id": 524828, "dataset_name": "refcoco", "area": 29765.643799999998, "iscrowd": 0, "image_id": 732, "category_id": 1, "bbox_list": [ [ 225.59, 52.48, 407.48, 384.53000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578521.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: a man about to dab into some food with his utencil.", "normal_caption": "a man about to dab into some food with his utencil", "solution": [ 225.59, 52.48, 408.48, 385.53 ], "normalized_solution": [ 352, 109, 638, 803 ] }, { "height": 480, "width": 640, "id": 733, "original_id": 524828, "dataset_name": "refcoco", "area": 29765.643799999998, "iscrowd": 0, "image_id": 733, "category_id": 1, "bbox_list": [ [ 225.59, 52.48, 407.48, 384.53000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578521.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in middle with plate.", "normal_caption": "guy in middle with plate", "solution": [ 225.59, 52.48, 408.48, 385.53 ], "normalized_solution": [ 352, 109, 638, 803 ] }, { "height": 480, "width": 640, "id": 734, "original_id": 212070, "dataset_name": "refcoco", "area": 25015.156900000013, "iscrowd": 0, "image_id": 734, "category_id": 1, "bbox_list": [ [ 175.5, 209.74, 326.62, 476.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: little girl.", "normal_caption": "little girl", "solution": [ 175.5, 209.74, 327.62, 477.85 ], "normalized_solution": [ 274, 436, 511, 995 ] }, { "height": 480, "width": 640, "id": 735, "original_id": 212070, "dataset_name": "refcoco", "area": 25015.156900000013, "iscrowd": 0, "image_id": 735, "category_id": 1, "bbox_list": [ [ 175.5, 209.74, 326.62, 476.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the little girl.", "normal_caption": "the little girl", "solution": [ 175.5, 209.74, 327.62, 477.85 ], "normalized_solution": [ 274, 436, 511, 995 ] }, { "height": 480, "width": 640, "id": 736, "original_id": 212070, "dataset_name": "refcoco", "area": 25015.156900000013, "iscrowd": 0, "image_id": 736, "category_id": 1, "bbox_list": [ [ 175.5, 209.74, 326.62, 476.85 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid.", "normal_caption": "kid", "solution": [ 175.5, 209.74, 327.62, 477.85 ], "normalized_solution": [ 274, 436, 511, 995 ] }, { "height": 480, "width": 640, "id": 737, "original_id": 193952, "dataset_name": "refcoco", "area": 57847.39555, "iscrowd": 0, "image_id": 737, "category_id": 1, "bbox_list": [ [ 348.7, 144.22, 639.0, 473.62 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in purple.", "normal_caption": "girl in purple", "solution": [ 348.7, 144.22, 640.0, 474.62 ], "normalized_solution": [ 544, 300, 1000, 988 ] }, { "height": 480, "width": 640, "id": 738, "original_id": 193952, "dataset_name": "refcoco", "area": 57847.39555, "iscrowd": 0, "image_id": 738, "category_id": 1, "bbox_list": [ [ 348.7, 144.22, 639.0, 473.62 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady in purple.", "normal_caption": "lady in purple", "solution": [ 348.7, 144.22, 640.0, 474.62 ], "normalized_solution": [ 544, 300, 1000, 988 ] }, { "height": 480, "width": 640, "id": 739, "original_id": 193952, "dataset_name": "refcoco", "area": 57847.39555, "iscrowd": 0, "image_id": 739, "category_id": 1, "bbox_list": [ [ 348.7, 144.22, 639.0, 473.62 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl on right.", "normal_caption": "girl on right", "solution": [ 348.7, 144.22, 640.0, 474.62 ], "normalized_solution": [ 544, 300, 1000, 988 ] }, { "height": 480, "width": 640, "id": 740, "original_id": 62574, "dataset_name": "refcoco", "area": 40528.15400000002, "iscrowd": 0, "image_id": 740, "category_id": 20, "bbox_list": [ [ 268.16, 153.72, 512.04, 456.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sheep by girl.", "normal_caption": "sheep by girl", "solution": [ 268.16, 153.72, 513.04, 457.01 ], "normalized_solution": [ 419, 320, 801, 952 ] }, { "height": 480, "width": 640, "id": 741, "original_id": 62574, "dataset_name": "refcoco", "area": 40528.15400000002, "iscrowd": 0, "image_id": 741, "category_id": 20, "bbox_list": [ [ 268.16, 153.72, 512.04, 456.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sheep being fed.", "normal_caption": "sheep being fed", "solution": [ 268.16, 153.72, 513.04, 457.01 ], "normalized_solution": [ 419, 320, 801, 952 ] }, { "height": 480, "width": 640, "id": 742, "original_id": 62574, "dataset_name": "refcoco", "area": 40528.15400000002, "iscrowd": 0, "image_id": 742, "category_id": 20, "bbox_list": [ [ 268.16, 153.72, 512.04, 456.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578519.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sheep being petted.", "normal_caption": "sheep being petted", "solution": [ 268.16, 153.72, 513.04, 457.01 ], "normalized_solution": [ 419, 320, 801, 952 ] }, { "height": 427, "width": 640, "id": 743, "original_id": 1234853, "dataset_name": "refcoco", "area": 16919.754150000004, "iscrowd": 0, "image_id": 743, "category_id": 1, "bbox_list": [ [ 0.0, 216.7, 143.89, 398.97 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578513.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: he is the catching for baseballt.", "normal_caption": "he is the catching for baseballt", "solution": [ 0.0, 216.7, 144.89, 399.97 ], "normalized_solution": [ 0, 507, 226, 936 ] }, { "height": 427, "width": 640, "id": 744, "original_id": 1234853, "dataset_name": "refcoco", "area": 16919.754150000004, "iscrowd": 0, "image_id": 744, "category_id": 1, "bbox_list": [ [ 0.0, 216.7, 143.89, 398.97 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578513.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: catcher.", "normal_caption": "catcher", "solution": [ 0.0, 216.7, 144.89, 399.97 ], "normalized_solution": [ 0, 507, 226, 936 ] }, { "height": 427, "width": 640, "id": 745, "original_id": 1234853, "dataset_name": "refcoco", "area": 16919.754150000004, "iscrowd": 0, "image_id": 745, "category_id": 1, "bbox_list": [ [ 0.0, 216.7, 143.89, 398.97 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578513.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: catcher.", "normal_caption": "catcher", "solution": [ 0.0, 216.7, 144.89, 399.97 ], "normalized_solution": [ 0, 507, 226, 936 ] }, { "height": 427, "width": 640, "id": 746, "original_id": 1212565, "dataset_name": "refcoco", "area": 22820.11515, "iscrowd": 0, "image_id": 746, "category_id": 1, "bbox_list": [ [ 136.64, 107.12, 327.03999999999996, 407.05 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578513.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: number 19.", "normal_caption": "number 19", "solution": [ 136.64, 107.12, 328.04, 408.05 ], "normalized_solution": [ 213, 250, 512, 955 ] }, { "height": 427, "width": 640, "id": 747, "original_id": 1212565, "dataset_name": "refcoco", "area": 22820.11515, "iscrowd": 0, "image_id": 747, "category_id": 1, "bbox_list": [ [ 136.64, 107.12, 327.03999999999996, 407.05 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578513.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the batter.", "normal_caption": "the batter", "solution": [ 136.64, 107.12, 328.04, 408.05 ], "normalized_solution": [ 213, 250, 512, 955 ] }, { "height": 427, "width": 640, "id": 748, "original_id": 1212565, "dataset_name": "refcoco", "area": 22820.11515, "iscrowd": 0, "image_id": 748, "category_id": 1, "bbox_list": [ [ 136.64, 107.12, 327.03999999999996, 407.05 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578513.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: baseball player.", "normal_caption": "baseball player", "solution": [ 136.64, 107.12, 328.04, 408.05 ], "normalized_solution": [ 213, 250, 512, 955 ] }, { "height": 480, "width": 640, "id": 749, "original_id": 1281449, "dataset_name": "refcoco", "area": 43015.387950000004, "iscrowd": 0, "image_id": 749, "category_id": 1, "bbox_list": [ [ 0.0, 26.64, 209.34, 471.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left woman in blk.", "normal_caption": "left woman in blk", "solution": [ 0.0, 26.64, 210.34, 472.12 ], "normalized_solution": [ 0, 55, 328, 983 ] }, { "height": 480, "width": 640, "id": 750, "original_id": 1281449, "dataset_name": "refcoco", "area": 43015.387950000004, "iscrowd": 0, "image_id": 750, "category_id": 1, "bbox_list": [ [ 0.0, 26.64, 209.34, 471.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left lady black dress.", "normal_caption": "left lady black dress", "solution": [ 0.0, 26.64, 210.34, 472.12 ], "normalized_solution": [ 0, 55, 328, 983 ] }, { "height": 480, "width": 640, "id": 751, "original_id": 1281449, "dataset_name": "refcoco", "area": 43015.387950000004, "iscrowd": 0, "image_id": 751, "category_id": 1, "bbox_list": [ [ 0.0, 26.64, 209.34, 471.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman left in black.", "normal_caption": "woman left in black", "solution": [ 0.0, 26.64, 210.34, 472.12 ], "normalized_solution": [ 0, 55, 328, 983 ] }, { "height": 480, "width": 640, "id": 752, "original_id": 1279737, "dataset_name": "refcoco", "area": 16328.9679, "iscrowd": 0, "image_id": 752, "category_id": 1, "bbox_list": [ [ 174.65, 240.36, 277.31, 470.34000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue kid close to cam on left.", "normal_caption": "blue kid close to cam on left", "solution": [ 174.65, 240.36, 278.31, 471.34 ], "normalized_solution": [ 272, 500, 434, 981 ] }, { "height": 480, "width": 640, "id": 753, "original_id": 1279737, "dataset_name": "refcoco", "area": 16328.9679, "iscrowd": 0, "image_id": 753, "category_id": 1, "bbox_list": [ [ 174.65, 240.36, 277.31, 470.34000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: light blue shirt under womans hand.", "normal_caption": "light blue shirt under womans hand", "solution": [ 174.65, 240.36, 278.31, 471.34 ], "normalized_solution": [ 272, 500, 434, 981 ] }, { "height": 480, "width": 640, "id": 754, "original_id": 1279737, "dataset_name": "refcoco", "area": 16328.9679, "iscrowd": 0, "image_id": 754, "category_id": 1, "bbox_list": [ [ 174.65, 240.36, 277.31, 470.34000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid light blue shirt near woman bottom.", "normal_caption": "kid light blue shirt near woman bottom", "solution": [ 174.65, 240.36, 278.31, 471.34 ], "normalized_solution": [ 272, 500, 434, 981 ] }, { "height": 480, "width": 640, "id": 755, "original_id": 1270453, "dataset_name": "refcoco", "area": 15607.360400000003, "iscrowd": 0, "image_id": 755, "category_id": 1, "bbox_list": [ [ 271.59, 268.95, 382.42999999999995, 478.7 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: child in front without shirt.", "normal_caption": "child in front without shirt", "solution": [ 271.59, 268.95, 383.43, 479.7 ], "normalized_solution": [ 424, 560, 599, 999 ] }, { "height": 480, "width": 640, "id": 756, "original_id": 1270453, "dataset_name": "refcoco", "area": 15607.360400000003, "iscrowd": 0, "image_id": 756, "category_id": 1, "bbox_list": [ [ 271.59, 268.95, 382.42999999999995, 478.7 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: kid bottom no shirt.", "normal_caption": "kid bottom no shirt", "solution": [ 271.59, 268.95, 383.43, 479.7 ], "normalized_solution": [ 424, 560, 599, 999 ] }, { "height": 480, "width": 640, "id": 757, "original_id": 1270453, "dataset_name": "refcoco", "area": 15607.360400000003, "iscrowd": 0, "image_id": 757, "category_id": 1, "bbox_list": [ [ 271.59, 268.95, 382.42999999999995, 478.7 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy with no shirt.", "normal_caption": "boy with no shirt", "solution": [ 271.59, 268.95, 383.43, 479.7 ], "normalized_solution": [ 424, 560, 599, 999 ] }, { "height": 480, "width": 640, "id": 758, "original_id": 1253842, "dataset_name": "refcoco", "area": 12380.807399999998, "iscrowd": 0, "image_id": 758, "category_id": 1, "bbox_list": [ [ 276.02, 67.39, 457.17999999999995, 260.45 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in cap.", "normal_caption": "guy in cap", "solution": [ 276.02, 67.39, 458.18, 261.45 ], "normalized_solution": [ 431, 140, 715, 544 ] }, { "height": 480, "width": 640, "id": 759, "original_id": 1253842, "dataset_name": "refcoco", "area": 12380.807399999998, "iscrowd": 0, "image_id": 759, "category_id": 1, "bbox_list": [ [ 276.02, 67.39, 457.17999999999995, 260.45 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in red shirt black hat reaching over table.", "normal_caption": "man in red shirt black hat reaching over table", "solution": [ 276.02, 67.39, 458.18, 261.45 ], "normalized_solution": [ 431, 140, 715, 544 ] }, { "height": 480, "width": 640, "id": 760, "original_id": 1253842, "dataset_name": "refcoco", "area": 12380.807399999998, "iscrowd": 0, "image_id": 760, "category_id": 1, "bbox_list": [ [ 276.02, 67.39, 457.17999999999995, 260.45 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man standing over table red shirt.", "normal_caption": "man standing over table red shirt", "solution": [ 276.02, 67.39, 458.18, 261.45 ], "normalized_solution": [ 431, 140, 715, 544 ] }, { "height": 480, "width": 640, "id": 761, "original_id": 1215841, "dataset_name": "refcoco", "area": 13354.79825, "iscrowd": 0, "image_id": 761, "category_id": 1, "bbox_list": [ [ 520.47, 328.52, 639.0, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom right kid.", "normal_caption": "bottom right kid", "solution": [ 520.47, 328.52, 640.0, 480.0 ], "normalized_solution": [ 813, 684, 1000, 1000 ] }, { "height": 480, "width": 640, "id": 762, "original_id": 1215841, "dataset_name": "refcoco", "area": 13354.79825, "iscrowd": 0, "image_id": 762, "category_id": 1, "bbox_list": [ [ 520.47, 328.52, 639.0, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy on right edge of pic in blue tshirt.", "normal_caption": "boy on right edge of pic in blue tshirt", "solution": [ 520.47, 328.52, 640.0, 480.0 ], "normalized_solution": [ 813, 684, 1000, 1000 ] }, { "height": 480, "width": 640, "id": 763, "original_id": 1210865, "dataset_name": "refcoco", "area": 19314.658150000003, "iscrowd": 0, "image_id": 763, "category_id": 1, "bbox_list": [ [ 374.29, 279.37, 513.52, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy bottom white shirt.", "normal_caption": "boy bottom white shirt", "solution": [ 374.29, 279.37, 514.52, 474.61 ], "normalized_solution": [ 584, 582, 803, 988 ] }, { "height": 480, "width": 640, "id": 764, "original_id": 1210865, "dataset_name": "refcoco", "area": 19314.658150000003, "iscrowd": 0, "image_id": 764, "category_id": 1, "bbox_list": [ [ 374.29, 279.37, 513.52, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: boy with white top.", "normal_caption": "boy with white top", "solution": [ 374.29, 279.37, 514.52, 474.61 ], "normalized_solution": [ 584, 582, 803, 988 ] }, { "height": 480, "width": 640, "id": 765, "original_id": 1210865, "dataset_name": "refcoco", "area": 19314.658150000003, "iscrowd": 0, "image_id": 765, "category_id": 1, "bbox_list": [ [ 374.29, 279.37, 513.52, 473.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second from lowerright white shirt orange accents.", "normal_caption": "second from lowerright white shirt orange accents", "solution": [ 374.29, 279.37, 514.52, 474.61 ], "normalized_solution": [ 584, 582, 803, 988 ] }, { "height": 480, "width": 640, "id": 766, "original_id": 2013924, "dataset_name": "refcoco", "area": 12758.917049999998, "iscrowd": 0, "image_id": 766, "category_id": 1, "bbox_list": [ [ 180.17, 0.43, 289.07, 193.67000000000002 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in back in black tank top.", "normal_caption": "woman in back in black tank top", "solution": [ 180.17, 0.43, 290.07, 194.67 ], "normalized_solution": [ 281, 0, 453, 405 ] }, { "height": 480, "width": 640, "id": 767, "original_id": 2013924, "dataset_name": "refcoco", "area": 12758.917049999998, "iscrowd": 0, "image_id": 767, "category_id": 1, "bbox_list": [ [ 180.17, 0.43, 289.07, 193.67000000000002 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black tank top standing in back.", "normal_caption": "black tank top standing in back", "solution": [ 180.17, 0.43, 290.07, 194.67 ], "normalized_solution": [ 281, 0, 453, 405 ] }, { "height": 480, "width": 640, "id": 768, "original_id": 2013924, "dataset_name": "refcoco", "area": 12758.917049999998, "iscrowd": 0, "image_id": 768, "category_id": 1, "bbox_list": [ [ 180.17, 0.43, 289.07, 193.67000000000002 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578459.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in black tank top and floral bottoms.", "normal_caption": "woman in black tank top and floral bottoms", "solution": [ 180.17, 0.43, 290.07, 194.67 ], "normalized_solution": [ 281, 0, 453, 405 ] }, { "height": 480, "width": 640, "id": 769, "original_id": 1397960, "dataset_name": "refcoco", "area": 31628.940450000002, "iscrowd": 0, "image_id": 769, "category_id": 15, "bbox_list": [ [ 0.0, 204.24, 249.91, 456.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578375.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left pink chair.", "normal_caption": "left pink chair", "solution": [ 0.0, 204.24, 250.91, 457.73 ], "normalized_solution": [ 0, 425, 392, 953 ] }, { "height": 480, "width": 640, "id": 770, "original_id": 1397960, "dataset_name": "refcoco", "area": 31628.940450000002, "iscrowd": 0, "image_id": 770, "category_id": 15, "bbox_list": [ [ 0.0, 204.24, 249.91, 456.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578375.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left bench pink colored.", "normal_caption": "left bench pink colored", "solution": [ 0.0, 204.24, 250.91, 457.73 ], "normalized_solution": [ 0, 425, 392, 953 ] }, { "height": 480, "width": 640, "id": 771, "original_id": 1397960, "dataset_name": "refcoco", "area": 31628.940450000002, "iscrowd": 0, "image_id": 771, "category_id": 15, "bbox_list": [ [ 0.0, 204.24, 249.91, 456.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578375.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink bench left.", "normal_caption": "pink bench left", "solution": [ 0.0, 204.24, 250.91, 457.73 ], "normalized_solution": [ 0, 425, 392, 953 ] }, { "height": 480, "width": 640, "id": 772, "original_id": 1810402, "dataset_name": "refcoco", "area": 10842.990599999997, "iscrowd": 0, "image_id": 772, "category_id": 15, "bbox_list": [ [ 39.1, 158.44, 223.94, 298.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578375.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange seat.", "normal_caption": "orange seat", "solution": [ 39.1, 158.44, 224.94, 299.51 ], "normalized_solution": [ 61, 330, 351, 623 ] }, { "height": 480, "width": 640, "id": 773, "original_id": 1810402, "dataset_name": "refcoco", "area": 10842.990599999997, "iscrowd": 0, "image_id": 773, "category_id": 15, "bbox_list": [ [ 39.1, 158.44, 223.94, 298.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578375.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange seat.", "normal_caption": "orange seat", "solution": [ 39.1, 158.44, 224.94, 299.51 ], "normalized_solution": [ 61, 330, 351, 623 ] }, { "height": 480, "width": 640, "id": 774, "original_id": 1810402, "dataset_name": "refcoco", "area": 10842.990599999997, "iscrowd": 0, "image_id": 774, "category_id": 15, "bbox_list": [ [ 39.1, 158.44, 223.94, 298.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578375.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange seat.", "normal_caption": "orange seat", "solution": [ 39.1, 158.44, 224.94, 299.51 ], "normalized_solution": [ 61, 330, 351, 623 ] }, { "height": 612, "width": 612, "id": 775, "original_id": 423485, "dataset_name": "refcoco", "area": 59027.437450000005, "iscrowd": 0, "image_id": 775, "category_id": 1, "bbox_list": [ [ 0.0, 88.91, 291.22, 603.42 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578369.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on left.", "normal_caption": "guy on left", "solution": [ 0.0, 88.91, 292.22, 604.42 ], "normalized_solution": [ 0, 145, 477, 987 ] }, { "height": 612, "width": 612, "id": 776, "original_id": 423485, "dataset_name": "refcoco", "area": 59027.437450000005, "iscrowd": 0, "image_id": 776, "category_id": 1, "bbox_list": [ [ 0.0, 88.91, 291.22, 603.42 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578369.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lleft guy cut off.", "normal_caption": "lleft guy cut off", "solution": [ 0.0, 88.91, 292.22, 604.42 ], "normalized_solution": [ 0, 145, 477, 987 ] }, { "height": 612, "width": 612, "id": 777, "original_id": 423485, "dataset_name": "refcoco", "area": 59027.437450000005, "iscrowd": 0, "image_id": 777, "category_id": 1, "bbox_list": [ [ 0.0, 88.91, 291.22, 603.42 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578369.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy left purple on shirt.", "normal_caption": "guy left purple on shirt", "solution": [ 0.0, 88.91, 292.22, 604.42 ], "normalized_solution": [ 0, 145, 477, 987 ] }, { "height": 557, "width": 640, "id": 778, "original_id": 1715783, "dataset_name": "refcoco", "area": 61504.36495, "iscrowd": 0, "image_id": 778, "category_id": 1, "bbox_list": [ [ 359.23, 196.51, 639.0, 547.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578331.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right.", "normal_caption": "woman on right", "solution": [ 359.23, 196.51, 640.0, 548.24 ], "normalized_solution": [ 561, 352, 1000, 984 ] }, { "height": 557, "width": 640, "id": 779, "original_id": 1715783, "dataset_name": "refcoco", "area": 61504.36495, "iscrowd": 0, "image_id": 779, "category_id": 1, "bbox_list": [ [ 359.23, 196.51, 639.0, 547.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578331.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right.", "normal_caption": "woman on right", "solution": [ 359.23, 196.51, 640.0, 548.24 ], "normalized_solution": [ 561, 352, 1000, 984 ] }, { "height": 557, "width": 640, "id": 780, "original_id": 1715783, "dataset_name": "refcoco", "area": 61504.36495, "iscrowd": 0, "image_id": 780, "category_id": 1, "bbox_list": [ [ 359.23, 196.51, 639.0, 547.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578331.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right woman.", "normal_caption": "right woman", "solution": [ 359.23, 196.51, 640.0, 548.24 ], "normalized_solution": [ 561, 352, 1000, 984 ] }, { "height": 557, "width": 640, "id": 781, "original_id": 184388, "dataset_name": "refcoco", "area": 59090.86205000001, "iscrowd": 0, "image_id": 781, "category_id": 1, "bbox_list": [ [ 101.39, 160.22, 325.69, 547.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578331.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: yellow shirt.", "normal_caption": "yellow shirt", "solution": [ 101.39, 160.22, 326.69, 548.24 ], "normalized_solution": [ 158, 287, 510, 984 ] }, { "height": 557, "width": 640, "id": 782, "original_id": 184388, "dataset_name": "refcoco", "area": 59090.86205000001, "iscrowd": 0, "image_id": 782, "category_id": 1, "bbox_list": [ [ 101.39, 160.22, 325.69, 547.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578331.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: yellow shirt.", "normal_caption": "yellow shirt", "solution": [ 101.39, 160.22, 326.69, 548.24 ], "normalized_solution": [ 158, 287, 510, 984 ] }, { "height": 557, "width": 640, "id": 783, "original_id": 184388, "dataset_name": "refcoco", "area": 59090.86205000001, "iscrowd": 0, "image_id": 783, "category_id": 1, "bbox_list": [ [ 101.39, 160.22, 325.69, 547.24 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578331.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: yellow shirt.", "normal_caption": "yellow shirt", "solution": [ 101.39, 160.22, 326.69, 548.24 ], "normalized_solution": [ 158, 287, 510, 984 ] }, { "height": 480, "width": 640, "id": 784, "original_id": 449764, "dataset_name": "refcoco", "area": 43468.05360000001, "iscrowd": 0, "image_id": 784, "category_id": 1, "bbox_list": [ [ 156.4, 203.06, 421.83000000000004, 471.72 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578326.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in front.", "normal_caption": "guy in front", "solution": [ 156.4, 203.06, 422.83, 472.72 ], "normalized_solution": [ 244, 423, 660, 984 ] }, { "height": 480, "width": 640, "id": 785, "original_id": 449764, "dataset_name": "refcoco", "area": 43468.05360000001, "iscrowd": 0, "image_id": 785, "category_id": 1, "bbox_list": [ [ 156.4, 203.06, 421.83000000000004, 471.72 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578326.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man next to oven.", "normal_caption": "man next to oven", "solution": [ 156.4, 203.06, 422.83, 472.72 ], "normalized_solution": [ 244, 423, 660, 984 ] }, { "height": 480, "width": 640, "id": 786, "original_id": 449764, "dataset_name": "refcoco", "area": 43468.05360000001, "iscrowd": 0, "image_id": 786, "category_id": 1, "bbox_list": [ [ 156.4, 203.06, 421.83000000000004, 471.72 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578326.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy.", "normal_caption": "guy", "solution": [ 156.4, 203.06, 422.83, 472.72 ], "normalized_solution": [ 244, 423, 660, 984 ] }, { "height": 480, "width": 640, "id": 787, "original_id": 433685, "dataset_name": "refcoco", "area": 62796.78710000001, "iscrowd": 0, "image_id": 787, "category_id": 1, "bbox_list": [ [ 111.6, 5.15, 487.66999999999996, 473.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578326.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 111.6, 5.15, 488.67, 474.31 ], "normalized_solution": [ 174, 10, 763, 988 ] }, { "height": 480, "width": 640, "id": 788, "original_id": 433685, "dataset_name": "refcoco", "area": 62796.78710000001, "iscrowd": 0, "image_id": 788, "category_id": 1, "bbox_list": [ [ 111.6, 5.15, 487.66999999999996, 473.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578326.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 111.6, 5.15, 488.67, 474.31 ], "normalized_solution": [ 174, 10, 763, 988 ] }, { "height": 480, "width": 640, "id": 789, "original_id": 433685, "dataset_name": "refcoco", "area": 62796.78710000001, "iscrowd": 0, "image_id": 789, "category_id": 1, "bbox_list": [ [ 111.6, 5.15, 487.66999999999996, 473.31 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578326.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 111.6, 5.15, 488.67, 474.31 ], "normalized_solution": [ 174, 10, 763, 988 ] }, { "height": 508, "width": 640, "id": 790, "original_id": 462117, "dataset_name": "refcoco", "area": 38630.48305, "iscrowd": 0, "image_id": 790, "category_id": 1, "bbox_list": [ [ 92.47, 147.26, 304.94, 496.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578250.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on left.", "normal_caption": "woman on left", "solution": [ 92.47, 147.26, 305.94, 497.73 ], "normalized_solution": [ 144, 289, 478, 979 ] }, { "height": 508, "width": 640, "id": 791, "original_id": 462117, "dataset_name": "refcoco", "area": 38630.48305, "iscrowd": 0, "image_id": 791, "category_id": 1, "bbox_list": [ [ 92.47, 147.26, 304.94, 496.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578250.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: young woman on left.", "normal_caption": "young woman on left", "solution": [ 92.47, 147.26, 305.94, 497.73 ], "normalized_solution": [ 144, 289, 478, 979 ] }, { "height": 508, "width": 640, "id": 792, "original_id": 462117, "dataset_name": "refcoco", "area": 38630.48305, "iscrowd": 0, "image_id": 792, "category_id": 1, "bbox_list": [ [ 92.47, 147.26, 304.94, 496.73 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578250.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lady on left.", "normal_caption": "lady on left", "solution": [ 92.47, 147.26, 305.94, 497.73 ], "normalized_solution": [ 144, 289, 478, 979 ] }, { "height": 508, "width": 640, "id": 793, "original_id": 425947, "dataset_name": "refcoco", "area": 31881.394150000015, "iscrowd": 0, "image_id": 793, "category_id": 1, "bbox_list": [ [ 337.52, 157.32, 532.17, 499.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578250.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right.", "normal_caption": "woman on right", "solution": [ 337.52, 157.32, 533.17, 500.56 ], "normalized_solution": [ 527, 309, 833, 985 ] }, { "height": 508, "width": 640, "id": 794, "original_id": 425947, "dataset_name": "refcoco", "area": 31881.394150000015, "iscrowd": 0, "image_id": 794, "category_id": 1, "bbox_list": [ [ 337.52, 157.32, 532.17, 499.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578250.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right woman.", "normal_caption": "right woman", "solution": [ 337.52, 157.32, 533.17, 500.56 ], "normalized_solution": [ 527, 309, 833, 985 ] }, { "height": 508, "width": 640, "id": 795, "original_id": 425947, "dataset_name": "refcoco", "area": 31881.394150000015, "iscrowd": 0, "image_id": 795, "category_id": 1, "bbox_list": [ [ 337.52, 157.32, 532.17, 499.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578250.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right person.", "normal_caption": "right person", "solution": [ 337.52, 157.32, 533.17, 500.56 ], "normalized_solution": [ 527, 309, 833, 985 ] }, { "height": 360, "width": 640, "id": 796, "original_id": 112145, "dataset_name": "refcoco", "area": 11796.119250000002, "iscrowd": 0, "image_id": 796, "category_id": 63, "bbox_list": [ [ 0.0, 276.61, 265.7, 354.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578184.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left couch.", "normal_caption": "bottom left couch", "solution": [ 0.0, 276.61, 266.7, 355.92 ], "normalized_solution": [ 0, 768, 416, 988 ] }, { "height": 360, "width": 640, "id": 797, "original_id": 112145, "dataset_name": "refcoco", "area": 11796.119250000002, "iscrowd": 0, "image_id": 797, "category_id": 63, "bbox_list": [ [ 0.0, 276.61, 265.7, 354.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578184.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front couch.", "normal_caption": "front couch", "solution": [ 0.0, 276.61, 266.7, 355.92 ], "normalized_solution": [ 0, 768, 416, 988 ] }, { "height": 360, "width": 640, "id": 798, "original_id": 100049, "dataset_name": "refcoco", "area": 30920.395499999995, "iscrowd": 0, "image_id": 798, "category_id": 63, "bbox_list": [ [ 356.13, 190.45, 639.0, 352.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578184.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right couch.", "normal_caption": "right couch", "solution": [ 356.13, 190.45, 640.0, 353.81 ], "normalized_solution": [ 556, 529, 1000, 982 ] }, { "height": 360, "width": 640, "id": 799, "original_id": 100049, "dataset_name": "refcoco", "area": 30920.395499999995, "iscrowd": 0, "image_id": 799, "category_id": 63, "bbox_list": [ [ 356.13, 190.45, 639.0, 352.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578184.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sofa on right.", "normal_caption": "sofa on right", "solution": [ 356.13, 190.45, 640.0, 353.81 ], "normalized_solution": [ 556, 529, 1000, 982 ] }, { "height": 360, "width": 640, "id": 800, "original_id": 100049, "dataset_name": "refcoco", "area": 30920.395499999995, "iscrowd": 0, "image_id": 800, "category_id": 63, "bbox_list": [ [ 356.13, 190.45, 639.0, 352.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578184.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: couch on right.", "normal_caption": "couch on right", "solution": [ 356.13, 190.45, 640.0, 353.81 ], "normalized_solution": [ 556, 529, 1000, 982 ] }, { "height": 422, "width": 600, "id": 801, "original_id": 63397, "dataset_name": "refcoco", "area": 24004.804699999986, "iscrowd": 0, "image_id": 801, "category_id": 20, "bbox_list": [ [ 74.28, 121.59, 280.89, 387.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: lamb left.", "normal_caption": "lamb left", "solution": [ 74.28, 121.59, 281.89, 388.61 ], "normalized_solution": [ 123, 288, 469, 920 ] }, { "height": 422, "width": 600, "id": 802, "original_id": 63397, "dataset_name": "refcoco", "area": 24004.804699999986, "iscrowd": 0, "image_id": 802, "category_id": 20, "bbox_list": [ [ 74.28, 121.59, 280.89, 387.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left animal.", "normal_caption": "left animal", "solution": [ 74.28, 121.59, 281.89, 388.61 ], "normalized_solution": [ 123, 288, 469, 920 ] }, { "height": 422, "width": 600, "id": 803, "original_id": 63397, "dataset_name": "refcoco", "area": 24004.804699999986, "iscrowd": 0, "image_id": 803, "category_id": 20, "bbox_list": [ [ 74.28, 121.59, 280.89, 387.61 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: animal left.", "normal_caption": "animal left", "solution": [ 74.28, 121.59, 281.89, 388.61 ], "normalized_solution": [ 123, 288, 469, 920 ] }, { "height": 422, "width": 600, "id": 804, "original_id": 62460, "dataset_name": "refcoco", "area": 15997.72345, "iscrowd": 0, "image_id": 804, "category_id": 20, "bbox_list": [ [ 262.96, 141.1, 367.69, 403.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle sheep.", "normal_caption": "middle sheep", "solution": [ 262.96, 141.1, 368.69, 404.96 ], "normalized_solution": [ 438, 334, 614, 959 ] }, { "height": 422, "width": 600, "id": 805, "original_id": 62460, "dataset_name": "refcoco", "area": 15997.72345, "iscrowd": 0, "image_id": 805, "category_id": 20, "bbox_list": [ [ 262.96, 141.1, 367.69, 403.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle.", "normal_caption": "middle", "solution": [ 262.96, 141.1, 368.69, 404.96 ], "normalized_solution": [ 438, 334, 614, 959 ] }, { "height": 422, "width": 600, "id": 806, "original_id": 62460, "dataset_name": "refcoco", "area": 15997.72345, "iscrowd": 0, "image_id": 806, "category_id": 20, "bbox_list": [ [ 262.96, 141.1, 367.69, 403.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black lamb.", "normal_caption": "black lamb", "solution": [ 262.96, 141.1, 368.69, 404.96 ], "normalized_solution": [ 438, 334, 614, 959 ] }, { "height": 422, "width": 600, "id": 807, "original_id": 61407, "dataset_name": "refcoco", "area": 15937.065200000006, "iscrowd": 0, "image_id": 807, "category_id": 20, "bbox_list": [ [ 367.42, 156.12, 506.92, 394.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sheep on right.", "normal_caption": "sheep on right", "solution": [ 367.42, 156.12, 507.92, 395.53 ], "normalized_solution": [ 612, 369, 846, 937 ] }, { "height": 422, "width": 600, "id": 808, "original_id": 61407, "dataset_name": "refcoco", "area": 15937.065200000006, "iscrowd": 0, "image_id": 808, "category_id": 20, "bbox_list": [ [ 367.42, 156.12, 506.92, 394.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578154.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right goat all fluffy and cute.", "normal_caption": "right goat all fluffy and cute", "solution": [ 367.42, 156.12, 507.92, 395.53 ], "normalized_solution": [ 612, 369, 846, 937 ] }, { "height": 480, "width": 640, "id": 809, "original_id": 1223887, "dataset_name": "refcoco", "area": 20933.590799999994, "iscrowd": 0, "image_id": 809, "category_id": 1, "bbox_list": [ [ 166.11, 89.53, 342.01, 334.46000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle man.", "normal_caption": "middle man", "solution": [ 166.11, 89.53, 343.01, 335.46 ], "normalized_solution": [ 259, 186, 535, 698 ] }, { "height": 480, "width": 640, "id": 810, "original_id": 1223887, "dataset_name": "refcoco", "area": 20933.590799999994, "iscrowd": 0, "image_id": 810, "category_id": 1, "bbox_list": [ [ 166.11, 89.53, 342.01, 334.46000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle guy.", "normal_caption": "middle guy", "solution": [ 166.11, 89.53, 343.01, 335.46 ], "normalized_solution": [ 259, 186, 535, 698 ] }, { "height": 480, "width": 640, "id": 811, "original_id": 1223887, "dataset_name": "refcoco", "area": 20933.590799999994, "iscrowd": 0, "image_id": 811, "category_id": 1, "bbox_list": [ [ 166.11, 89.53, 342.01, 334.46000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in the middle.", "normal_caption": "guy in the middle", "solution": [ 166.11, 89.53, 343.01, 335.46 ], "normalized_solution": [ 259, 186, 535, 698 ] }, { "height": 480, "width": 640, "id": 812, "original_id": 1103507, "dataset_name": "refcoco", "area": 18190.408499999998, "iscrowd": 0, "image_id": 812, "category_id": 73, "bbox_list": [ [ 53.93, 239.46, 226.6, 381.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: leftmost laptop.", "normal_caption": "leftmost laptop", "solution": [ 53.93, 239.46, 227.6, 382.92 ], "normalized_solution": [ 84, 498, 355, 797 ] }, { "height": 480, "width": 640, "id": 813, "original_id": 1103507, "dataset_name": "refcoco", "area": 18190.408499999998, "iscrowd": 0, "image_id": 813, "category_id": 73, "bbox_list": [ [ 53.93, 239.46, 226.6, 381.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left laptop.", "normal_caption": "left laptop", "solution": [ 53.93, 239.46, 227.6, 382.92 ], "normalized_solution": [ 84, 498, 355, 797 ] }, { "height": 480, "width": 640, "id": 814, "original_id": 1103507, "dataset_name": "refcoco", "area": 18190.408499999998, "iscrowd": 0, "image_id": 814, "category_id": 73, "bbox_list": [ [ 53.93, 239.46, 226.6, 381.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the laptop the guy on the left has.", "normal_caption": "the laptop the guy on the left has", "solution": [ 53.93, 239.46, 227.6, 382.92 ], "normalized_solution": [ 84, 498, 355, 797 ] }, { "height": 480, "width": 640, "id": 815, "original_id": 1100254, "dataset_name": "refcoco", "area": 16970.650449999997, "iscrowd": 0, "image_id": 815, "category_id": 73, "bbox_list": [ [ 442.25, 271.82, 614.91, 374.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: laptop farthest right.", "normal_caption": "laptop farthest right", "solution": [ 442.25, 271.82, 615.91, 375.37 ], "normalized_solution": [ 691, 566, 962, 782 ] }, { "height": 480, "width": 640, "id": 816, "original_id": 1100254, "dataset_name": "refcoco", "area": 16970.650449999997, "iscrowd": 0, "image_id": 816, "category_id": 73, "bbox_list": [ [ 442.25, 271.82, 614.91, 374.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: apple laptop on right.", "normal_caption": "apple laptop on right", "solution": [ 442.25, 271.82, 615.91, 375.37 ], "normalized_solution": [ 691, 566, 962, 782 ] }, { "height": 480, "width": 640, "id": 817, "original_id": 1100254, "dataset_name": "refcoco", "area": 16970.650449999997, "iscrowd": 0, "image_id": 817, "category_id": 73, "bbox_list": [ [ 442.25, 271.82, 614.91, 374.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right laptop.", "normal_caption": "right laptop", "solution": [ 442.25, 271.82, 615.91, 375.37 ], "normalized_solution": [ 691, 566, 962, 782 ] }, { "height": 480, "width": 640, "id": 818, "original_id": 1737375, "dataset_name": "refcoco", "area": 35132.97839999999, "iscrowd": 0, "image_id": 818, "category_id": 1, "bbox_list": [ [ 392.3, 111.21, 639.0, 471.69 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on a computer.", "normal_caption": "man on a computer", "solution": [ 392.3, 111.21, 640.0, 472.69 ], "normalized_solution": [ 612, 231, 1000, 984 ] }, { "height": 480, "width": 640, "id": 819, "original_id": 1737375, "dataset_name": "refcoco", "area": 35132.97839999999, "iscrowd": 0, "image_id": 819, "category_id": 1, "bbox_list": [ [ 392.3, 111.21, 639.0, 471.69 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person on right.", "normal_caption": "person on right", "solution": [ 392.3, 111.21, 640.0, 472.69 ], "normalized_solution": [ 612, 231, 1000, 984 ] }, { "height": 480, "width": 640, "id": 820, "original_id": 1737375, "dataset_name": "refcoco", "area": 35132.97839999999, "iscrowd": 0, "image_id": 820, "category_id": 1, "bbox_list": [ [ 392.3, 111.21, 639.0, 471.69 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on the right.", "normal_caption": "man on the right", "solution": [ 392.3, 111.21, 640.0, 472.69 ], "normalized_solution": [ 612, 231, 1000, 984 ] }, { "height": 480, "width": 640, "id": 821, "original_id": 505905, "dataset_name": "refcoco", "area": 45372.0957, "iscrowd": 0, "image_id": 821, "category_id": 1, "bbox_list": [ [ 2.15, 79.39, 183.70000000000002, 473.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left person.", "normal_caption": "left person", "solution": [ 2.15, 79.39, 184.7, 474.56 ], "normalized_solution": [ 3, 165, 288, 988 ] }, { "height": 480, "width": 640, "id": 822, "original_id": 505905, "dataset_name": "refcoco", "area": 45372.0957, "iscrowd": 0, "image_id": 822, "category_id": 1, "bbox_list": [ [ 2.15, 79.39, 183.70000000000002, 473.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left dude.", "normal_caption": "left dude", "solution": [ 2.15, 79.39, 184.7, 474.56 ], "normalized_solution": [ 3, 165, 288, 988 ] }, { "height": 480, "width": 640, "id": 823, "original_id": 505905, "dataset_name": "refcoco", "area": 45372.0957, "iscrowd": 0, "image_id": 823, "category_id": 1, "bbox_list": [ [ 2.15, 79.39, 183.70000000000002, 473.56 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578128.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left person.", "normal_caption": "left person", "solution": [ 2.15, 79.39, 184.7, 474.56 ], "normalized_solution": [ 3, 165, 288, 988 ] }, { "height": 426, "width": 640, "id": 824, "original_id": 50412, "dataset_name": "refcoco", "area": 15769.08875, "iscrowd": 0, "image_id": 824, "category_id": 17, "bbox_list": [ [ 132.84, 116.35, 437.83000000000004, 219.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cat in back.", "normal_caption": "cat in back", "solution": [ 132.84, 116.35, 438.83, 220.79 ], "normalized_solution": [ 207, 273, 685, 518 ] }, { "height": 426, "width": 640, "id": 825, "original_id": 50412, "dataset_name": "refcoco", "area": 15769.08875, "iscrowd": 0, "image_id": 825, "category_id": 17, "bbox_list": [ [ 132.84, 116.35, 437.83000000000004, 219.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: gray cat.", "normal_caption": "gray cat", "solution": [ 132.84, 116.35, 438.83, 220.79 ], "normalized_solution": [ 207, 273, 685, 518 ] }, { "height": 426, "width": 640, "id": 826, "original_id": 50412, "dataset_name": "refcoco", "area": 15769.08875, "iscrowd": 0, "image_id": 826, "category_id": 17, "bbox_list": [ [ 132.84, 116.35, 437.83000000000004, 219.79 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far cat.", "normal_caption": "far cat", "solution": [ 132.84, 116.35, 438.83, 220.79 ], "normalized_solution": [ 207, 273, 685, 518 ] }, { "height": 426, "width": 640, "id": 827, "original_id": 50186, "dataset_name": "refcoco", "area": 49849.93470000001, "iscrowd": 0, "image_id": 827, "category_id": 17, "bbox_list": [ [ 120.01, 189.87, 488.21, 358.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front cat.", "normal_caption": "front cat", "solution": [ 120.01, 189.87, 489.21, 359.35 ], "normalized_solution": [ 187, 445, 764, 843 ] }, { "height": 426, "width": 640, "id": 828, "original_id": 50186, "dataset_name": "refcoco", "area": 49849.93470000001, "iscrowd": 0, "image_id": 828, "category_id": 17, "bbox_list": [ [ 120.01, 189.87, 488.21, 358.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front cat.", "normal_caption": "front cat", "solution": [ 120.01, 189.87, 489.21, 359.35 ], "normalized_solution": [ 187, 445, 764, 843 ] }, { "height": 426, "width": 640, "id": 829, "original_id": 50186, "dataset_name": "refcoco", "area": 49849.93470000001, "iscrowd": 0, "image_id": 829, "category_id": 17, "bbox_list": [ [ 120.01, 189.87, 488.21, 358.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578108.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black and gray cat.", "normal_caption": "black and gray cat", "solution": [ 120.01, 189.87, 489.21, 359.35 ], "normalized_solution": [ 187, 445, 764, 843 ] }, { "height": 612, "width": 612, "id": 830, "original_id": 522925, "dataset_name": "refcoco", "area": 13765.260200000002, "iscrowd": 0, "image_id": 830, "category_id": 1, "bbox_list": [ [ 135.05, 440.7, 246.46, 611.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578070.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink girl.", "normal_caption": "pink girl", "solution": [ 135.05, 440.7, 247.46, 612.0 ], "normalized_solution": [ 220, 720, 404, 1000 ] }, { "height": 612, "width": 612, "id": 831, "original_id": 522925, "dataset_name": "refcoco", "area": 13765.260200000002, "iscrowd": 0, "image_id": 831, "category_id": 1, "bbox_list": [ [ 135.05, 440.7, 246.46, 611.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578070.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in pink.", "normal_caption": "girl in pink", "solution": [ 135.05, 440.7, 247.46, 612.0 ], "normalized_solution": [ 220, 720, 404, 1000 ] }, { "height": 612, "width": 612, "id": 832, "original_id": 522925, "dataset_name": "refcoco", "area": 13765.260200000002, "iscrowd": 0, "image_id": 832, "category_id": 1, "bbox_list": [ [ 135.05, 440.7, 246.46, 611.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578070.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in pink.", "normal_caption": "girl in pink", "solution": [ 135.05, 440.7, 247.46, 612.0 ], "normalized_solution": [ 220, 720, 404, 1000 ] }, { "height": 612, "width": 612, "id": 833, "original_id": 518413, "dataset_name": "refcoco", "area": 13558.432099999998, "iscrowd": 0, "image_id": 833, "category_id": 1, "bbox_list": [ [ 254.43, 413.96, 357.95, 604.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578070.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl in front blue shirt and hat.", "normal_caption": "girl in front blue shirt and hat", "solution": [ 254.43, 413.96, 358.95, 605.12 ], "normalized_solution": [ 415, 676, 586, 988 ] }, { "height": 612, "width": 612, "id": 834, "original_id": 518413, "dataset_name": "refcoco", "area": 13558.432099999998, "iscrowd": 0, "image_id": 834, "category_id": 1, "bbox_list": [ [ 254.43, 413.96, 357.95, 604.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578070.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: in blue front.", "normal_caption": "in blue front", "solution": [ 254.43, 413.96, 358.95, 605.12 ], "normalized_solution": [ 415, 676, 586, 988 ] }, { "height": 612, "width": 612, "id": 835, "original_id": 518413, "dataset_name": "refcoco", "area": 13558.432099999998, "iscrowd": 0, "image_id": 835, "category_id": 1, "bbox_list": [ [ 254.43, 413.96, 357.95, 604.12 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578070.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person in blue bottom middle.", "normal_caption": "person in blue bottom middle", "solution": [ 254.43, 413.96, 358.95, 605.12 ], "normalized_solution": [ 415, 676, 586, 988 ] }, { "height": 480, "width": 640, "id": 836, "original_id": 2119723, "dataset_name": "refcoco", "area": 11449.054000000006, "iscrowd": 0, "image_id": 836, "category_id": 61, "bbox_list": [ [ 341.7, 183.32, 479.26, 339.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right half of sandwich.", "normal_caption": "right half of sandwich", "solution": [ 341.7, 183.32, 480.26, 340.65 ], "normalized_solution": [ 533, 381, 750, 709 ] }, { "height": 480, "width": 640, "id": 837, "original_id": 2119723, "dataset_name": "refcoco", "area": 11449.054000000006, "iscrowd": 0, "image_id": 837, "category_id": 61, "bbox_list": [ [ 341.7, 183.32, 479.26, 339.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right sandwich.", "normal_caption": "right sandwich", "solution": [ 341.7, 183.32, 480.26, 340.65 ], "normalized_solution": [ 533, 381, 750, 709 ] }, { "height": 480, "width": 640, "id": 838, "original_id": 2119723, "dataset_name": "refcoco", "area": 11449.054000000006, "iscrowd": 0, "image_id": 838, "category_id": 61, "bbox_list": [ [ 341.7, 183.32, 479.26, 339.65 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the triangle food on the right.", "normal_caption": "the triangle food on the right", "solution": [ 341.7, 183.32, 480.26, 340.65 ], "normalized_solution": [ 533, 381, 750, 709 ] }, { "height": 480, "width": 640, "id": 839, "original_id": 2119292, "dataset_name": "refcoco", "area": 17850.64925, "iscrowd": 0, "image_id": 839, "category_id": 61, "bbox_list": [ [ 211.2, 169.24, 349.91999999999996, 354.15999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: cheese part of sandwich.", "normal_caption": "cheese part of sandwich", "solution": [ 211.2, 169.24, 350.92, 355.16 ], "normalized_solution": [ 329, 352, 548, 739 ] }, { "height": 480, "width": 640, "id": 840, "original_id": 2119292, "dataset_name": "refcoco", "area": 17850.64925, "iscrowd": 0, "image_id": 840, "category_id": 61, "bbox_list": [ [ 211.2, 169.24, 349.91999999999996, 354.15999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left corner sandwich.", "normal_caption": "left corner sandwich", "solution": [ 211.2, 169.24, 350.92, 355.16 ], "normalized_solution": [ 329, 352, 548, 739 ] }, { "height": 480, "width": 640, "id": 841, "original_id": 2119292, "dataset_name": "refcoco", "area": 17850.64925, "iscrowd": 0, "image_id": 841, "category_id": 61, "bbox_list": [ [ 211.2, 169.24, 349.91999999999996, 354.15999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left side trianangle thingy on plate.", "normal_caption": "left side trianangle thingy on plate", "solution": [ 211.2, 169.24, 350.92, 355.16 ], "normalized_solution": [ 329, 352, 548, 739 ] }, { "height": 480, "width": 640, "id": 842, "original_id": 2119147, "dataset_name": "refcoco", "area": 14477.320600000003, "iscrowd": 0, "image_id": 842, "category_id": 61, "bbox_list": [ [ 366.94, 259.49, 521.61, 386.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pastry on bottom right of plate.", "normal_caption": "pastry on bottom right of plate", "solution": [ 366.94, 259.49, 522.61, 387.77 ], "normalized_solution": [ 573, 540, 816, 807 ] }, { "height": 480, "width": 640, "id": 843, "original_id": 2119147, "dataset_name": "refcoco", "area": 14477.320600000003, "iscrowd": 0, "image_id": 843, "category_id": 61, "bbox_list": [ [ 366.94, 259.49, 521.61, 386.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: nasty muffin right.", "normal_caption": "nasty muffin right", "solution": [ 366.94, 259.49, 522.61, 387.77 ], "normalized_solution": [ 573, 540, 816, 807 ] }, { "height": 480, "width": 640, "id": 844, "original_id": 2119147, "dataset_name": "refcoco", "area": 14477.320600000003, "iscrowd": 0, "image_id": 844, "category_id": 61, "bbox_list": [ [ 366.94, 259.49, 521.61, 386.77 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578063.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: round cake on plate.", "normal_caption": "round cake on plate", "solution": [ 366.94, 259.49, 522.61, 387.77 ], "normalized_solution": [ 573, 540, 816, 807 ] }, { "height": 436, "width": 640, "id": 845, "original_id": 1729682, "dataset_name": "refcoco", "area": 12721.699249999996, "iscrowd": 0, "image_id": 845, "category_id": 1, "bbox_list": [ [ 474.21, 157.74, 562.37, 413.44 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578056.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second from the right man.", "normal_caption": "second from the right man", "solution": [ 474.21, 157.74, 563.37, 414.44 ], "normalized_solution": [ 740, 361, 880, 950 ] }, { "height": 436, "width": 640, "id": 846, "original_id": 1729682, "dataset_name": "refcoco", "area": 12721.699249999996, "iscrowd": 0, "image_id": 846, "category_id": 1, "bbox_list": [ [ 474.21, 157.74, 562.37, 413.44 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578056.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy second from right.", "normal_caption": "guy second from right", "solution": [ 474.21, 157.74, 563.37, 414.44 ], "normalized_solution": [ 740, 361, 880, 950 ] }, { "height": 436, "width": 640, "id": 847, "original_id": 1729682, "dataset_name": "refcoco", "area": 12721.699249999996, "iscrowd": 0, "image_id": 847, "category_id": 1, "bbox_list": [ [ 474.21, 157.74, 562.37, 413.44 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578056.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second guy right to left.", "normal_caption": "second guy right to left", "solution": [ 474.21, 157.74, 563.37, 414.44 ], "normalized_solution": [ 740, 361, 880, 950 ] }, { "height": 436, "width": 640, "id": 848, "original_id": 224910, "dataset_name": "refcoco", "area": 11797.994899999994, "iscrowd": 0, "image_id": 848, "category_id": 1, "bbox_list": [ [ 553.57, 168.24, 630.96, 413.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578056.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man on far right.", "normal_caption": "man on far right", "solution": [ 553.57, 168.24, 631.96, 414.17 ], "normalized_solution": [ 864, 385, 987, 949 ] }, { "height": 436, "width": 640, "id": 849, "original_id": 224910, "dataset_name": "refcoco", "area": 11797.994899999994, "iscrowd": 0, "image_id": 849, "category_id": 1, "bbox_list": [ [ 553.57, 168.24, 630.96, 413.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578056.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man to the very right.", "normal_caption": "man to the very right", "solution": [ 553.57, 168.24, 631.96, 414.17 ], "normalized_solution": [ 864, 385, 987, 949 ] }, { "height": 436, "width": 640, "id": 850, "original_id": 224910, "dataset_name": "refcoco", "area": 11797.994899999994, "iscrowd": 0, "image_id": 850, "category_id": 1, "bbox_list": [ [ 553.57, 168.24, 630.96, 413.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578056.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy far right.", "normal_caption": "guy far right", "solution": [ 553.57, 168.24, 631.96, 414.17 ], "normalized_solution": [ 864, 385, 987, 949 ] }, { "height": 480, "width": 640, "id": 851, "original_id": 2218492, "dataset_name": "refcoco", "area": 38081.507499999985, "iscrowd": 0, "image_id": 851, "category_id": 54, "bbox_list": [ [ 357.93, 123.26, 639.0, 345.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578046.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right piece of food.", "normal_caption": "right piece of food", "solution": [ 357.93, 123.26, 640.0, 346.07 ], "normalized_solution": [ 559, 256, 1000, 720 ] }, { "height": 480, "width": 640, "id": 852, "original_id": 2218492, "dataset_name": "refcoco", "area": 38081.507499999985, "iscrowd": 0, "image_id": 852, "category_id": 54, "bbox_list": [ [ 357.93, 123.26, 639.0, 345.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578046.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right piece.", "normal_caption": "right piece", "solution": [ 357.93, 123.26, 640.0, 346.07 ], "normalized_solution": [ 559, 256, 1000, 720 ] }, { "height": 480, "width": 640, "id": 853, "original_id": 1909063, "dataset_name": "refcoco", "area": 33391.943999999996, "iscrowd": 0, "image_id": 853, "category_id": 54, "bbox_list": [ [ 122.34, 124.85, 385.57000000000005, 340.48 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578046.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: piece on left.", "normal_caption": "piece on left", "solution": [ 122.34, 124.85, 386.57, 341.48 ], "normalized_solution": [ 191, 260, 604, 711 ] }, { "height": 480, "width": 640, "id": 854, "original_id": 1909063, "dataset_name": "refcoco", "area": 33391.943999999996, "iscrowd": 0, "image_id": 854, "category_id": 54, "bbox_list": [ [ 122.34, 124.85, 385.57000000000005, 340.48 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578046.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: sandwich on left near fork.", "normal_caption": "sandwich on left near fork", "solution": [ 122.34, 124.85, 386.57, 341.48 ], "normalized_solution": [ 191, 260, 604, 711 ] }, { "height": 427, "width": 640, "id": 855, "original_id": 462653, "dataset_name": "refcoco", "area": 11829.26075, "iscrowd": 0, "image_id": 855, "category_id": 1, "bbox_list": [ [ 549.37, 73.72, 630.9300000000001, 308.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man at far right with yellow shirt.", "normal_caption": "man at far right with yellow shirt", "solution": [ 549.37, 73.72, 631.93, 309.01 ], "normalized_solution": [ 858, 172, 987, 723 ] }, { "height": 427, "width": 640, "id": 856, "original_id": 462653, "dataset_name": "refcoco", "area": 11829.26075, "iscrowd": 0, "image_id": 856, "category_id": 1, "bbox_list": [ [ 549.37, 73.72, 630.9300000000001, 308.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in yellow.", "normal_caption": "man in yellow", "solution": [ 549.37, 73.72, 631.93, 309.01 ], "normalized_solution": [ 858, 172, 987, 723 ] }, { "height": 427, "width": 640, "id": 857, "original_id": 462653, "dataset_name": "refcoco", "area": 11829.26075, "iscrowd": 0, "image_id": 857, "category_id": 1, "bbox_list": [ [ 549.37, 73.72, 630.9300000000001, 308.01 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange shirt.", "normal_caption": "orange shirt", "solution": [ 549.37, 73.72, 631.93, 309.01 ], "normalized_solution": [ 858, 172, 987, 723 ] }, { "height": 427, "width": 640, "id": 858, "original_id": 460135, "dataset_name": "refcoco", "area": 10569.2877, "iscrowd": 0, "image_id": 858, "category_id": 1, "bbox_list": [ [ 462.56, 83.03, 540.97, 315.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy in black shirt next to yello shirt guy.", "normal_caption": "guy in black shirt next to yello shirt guy", "solution": [ 462.56, 83.03, 541.97, 316.22 ], "normalized_solution": [ 722, 194, 846, 740 ] }, { "height": 427, "width": 640, "id": 859, "original_id": 460135, "dataset_name": "refcoco", "area": 10569.2877, "iscrowd": 0, "image_id": 859, "category_id": 1, "bbox_list": [ [ 462.56, 83.03, 540.97, 315.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: ahh you where off like one pixel lol dude on right black shirt.", "normal_caption": "ahh you where off like one pixel lol dude on right black shirt", "solution": [ 462.56, 83.03, 541.97, 316.22 ], "normalized_solution": [ 722, 194, 846, 740 ] }, { "height": 427, "width": 640, "id": 860, "original_id": 460135, "dataset_name": "refcoco", "area": 10569.2877, "iscrowd": 0, "image_id": 860, "category_id": 1, "bbox_list": [ [ 462.56, 83.03, 540.97, 315.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: dude black shirt.", "normal_caption": "dude black shirt", "solution": [ 462.56, 83.03, 541.97, 316.22 ], "normalized_solution": [ 722, 194, 846, 740 ] }, { "height": 427, "width": 640, "id": 861, "original_id": 430836, "dataset_name": "refcoco", "area": 18307.1285, "iscrowd": 0, "image_id": 861, "category_id": 1, "bbox_list": [ [ 244.14, 61.27, 341.75, 381.96 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man in tank top skate boarding.", "normal_caption": "man in tank top skate boarding", "solution": [ 244.14, 61.27, 342.75, 382.96 ], "normalized_solution": [ 381, 143, 535, 896 ] }, { "height": 427, "width": 640, "id": 862, "original_id": 430836, "dataset_name": "refcoco", "area": 18307.1285, "iscrowd": 0, "image_id": 862, "category_id": 1, "bbox_list": [ [ 244.14, 61.27, 341.75, 381.96 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: skateboarder.", "normal_caption": "skateboarder", "solution": [ 244.14, 61.27, 342.75, 382.96 ], "normalized_solution": [ 381, 143, 535, 896 ] }, { "height": 427, "width": 640, "id": 863, "original_id": 430836, "dataset_name": "refcoco", "area": 18307.1285, "iscrowd": 0, "image_id": 863, "category_id": 1, "bbox_list": [ [ 244.14, 61.27, 341.75, 381.96 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578037.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: skateboarder.", "normal_caption": "skateboarder", "solution": [ 244.14, 61.27, 342.75, 382.96 ], "normalized_solution": [ 381, 143, 535, 896 ] }, { "height": 448, "width": 500, "id": 864, "original_id": 1841768, "dataset_name": "refcoco", "area": 44240.63309999999, "iscrowd": 0, "image_id": 864, "category_id": 33, "bbox_list": [ [ 306.04, 165.24, 498.20000000000005, 436.53000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: click on the word right.", "normal_caption": "click on the word right", "solution": [ 306.04, 165.24, 499.2, 437.53 ], "normalized_solution": [ 612, 368, 998, 976 ] }, { "height": 448, "width": 500, "id": 865, "original_id": 1841768, "dataset_name": "refcoco", "area": 44240.63309999999, "iscrowd": 0, "image_id": 865, "category_id": 33, "bbox_list": [ [ 306.04, 165.24, 498.20000000000005, 436.53000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right bottom.", "normal_caption": "right bottom", "solution": [ 306.04, 165.24, 499.2, 437.53 ], "normalized_solution": [ 612, 368, 998, 976 ] }, { "height": 448, "width": 500, "id": 866, "original_id": 1841768, "dataset_name": "refcoco", "area": 44240.63309999999, "iscrowd": 0, "image_id": 866, "category_id": 33, "bbox_list": [ [ 306.04, 165.24, 498.20000000000005, 436.53000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom right back.", "normal_caption": "bottom right back", "solution": [ 306.04, 165.24, 499.2, 437.53 ], "normalized_solution": [ 612, 368, 998, 976 ] }, { "height": 448, "width": 500, "id": 867, "original_id": 1187604, "dataset_name": "refcoco", "area": 26846.32165, "iscrowd": 0, "image_id": 867, "category_id": 33, "bbox_list": [ [ 156.97, 259.19, 310.68, 447.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: suitcase on the bottom center with three items in it.", "normal_caption": "suitcase on the bottom center with three items in it", "solution": [ 156.97, 259.19, 311.68, 448.0 ], "normalized_solution": [ 313, 578, 623, 1000 ] }, { "height": 448, "width": 500, "id": 868, "original_id": 1187604, "dataset_name": "refcoco", "area": 26846.32165, "iscrowd": 0, "image_id": 868, "category_id": 33, "bbox_list": [ [ 156.97, 259.19, 310.68, 447.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle blue luggage.", "normal_caption": "middle blue luggage", "solution": [ 156.97, 259.19, 311.68, 448.0 ], "normalized_solution": [ 313, 578, 623, 1000 ] }, { "height": 448, "width": 500, "id": 869, "original_id": 1187604, "dataset_name": "refcoco", "area": 26846.32165, "iscrowd": 0, "image_id": 869, "category_id": 33, "bbox_list": [ [ 156.97, 259.19, 310.68, 447.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: very.", "normal_caption": "very", "solution": [ 156.97, 259.19, 311.68, 448.0 ], "normalized_solution": [ 313, 578, 623, 1000 ] }, { "height": 448, "width": 500, "id": 870, "original_id": 1186471, "dataset_name": "refcoco", "area": 31876.645450000004, "iscrowd": 0, "image_id": 870, "category_id": 33, "bbox_list": [ [ 1.01, 34.06, 185.25, 225.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left bag.", "normal_caption": "top left bag", "solution": [ 1.01, 34.06, 186.25, 226.35 ], "normalized_solution": [ 2, 76, 372, 505 ] }, { "height": 448, "width": 500, "id": 871, "original_id": 1186471, "dataset_name": "refcoco", "area": 31876.645450000004, "iscrowd": 0, "image_id": 871, "category_id": 33, "bbox_list": [ [ 1.01, 34.06, 185.25, 225.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: upper left kuggage.", "normal_caption": "upper left kuggage", "solution": [ 1.01, 34.06, 186.25, 226.35 ], "normalized_solution": [ 2, 76, 372, 505 ] }, { "height": 448, "width": 500, "id": 872, "original_id": 1186471, "dataset_name": "refcoco", "area": 31876.645450000004, "iscrowd": 0, "image_id": 872, "category_id": 33, "bbox_list": [ [ 1.01, 34.06, 185.25, 225.35 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top left luggage.", "normal_caption": "top left luggage", "solution": [ 1.01, 34.06, 186.25, 226.35 ], "normalized_solution": [ 2, 76, 372, 505 ] }, { "height": 448, "width": 500, "id": 873, "original_id": 1186166, "dataset_name": "refcoco", "area": 28457.8688, "iscrowd": 0, "image_id": 873, "category_id": 33, "bbox_list": [ [ 171.53, 36.83, 331.97, 246.70999999999998 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top center clothes.", "normal_caption": "top center clothes", "solution": [ 171.53, 36.83, 332.97, 247.71 ], "normalized_solution": [ 343, 82, 665, 552 ] }, { "height": 448, "width": 500, "id": 874, "original_id": 1186166, "dataset_name": "refcoco", "area": 28457.8688, "iscrowd": 0, "image_id": 874, "category_id": 33, "bbox_list": [ [ 171.53, 36.83, 331.97, 246.70999999999998 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle blue open bag top.", "normal_caption": "middle blue open bag top", "solution": [ 171.53, 36.83, 332.97, 247.71 ], "normalized_solution": [ 343, 82, 665, 552 ] }, { "height": 448, "width": 500, "id": 875, "original_id": 1186166, "dataset_name": "refcoco", "area": 28457.8688, "iscrowd": 0, "image_id": 875, "category_id": 33, "bbox_list": [ [ 171.53, 36.83, 331.97, 246.70999999999998 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top center section.", "normal_caption": "top center section", "solution": [ 171.53, 36.83, 332.97, 247.71 ], "normalized_solution": [ 343, 82, 665, 552 ] }, { "height": 448, "width": 500, "id": 876, "original_id": 1185061, "dataset_name": "refcoco", "area": 24532.900700000002, "iscrowd": 0, "image_id": 876, "category_id": 33, "bbox_list": [ [ 322.98, 0.53, 472.09000000000003, 202.78 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: luggage top right pink tag.", "normal_caption": "luggage top right pink tag", "solution": [ 322.98, 0.53, 473.09, 203.78 ], "normalized_solution": [ 645, 1, 946, 454 ] }, { "height": 448, "width": 500, "id": 877, "original_id": 1185061, "dataset_name": "refcoco", "area": 24532.900700000002, "iscrowd": 0, "image_id": 877, "category_id": 33, "bbox_list": [ [ 322.98, 0.53, 472.09000000000003, 202.78 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: closed suitcase top right.", "normal_caption": "closed suitcase top right", "solution": [ 322.98, 0.53, 473.09, 203.78 ], "normalized_solution": [ 645, 1, 946, 454 ] }, { "height": 448, "width": 500, "id": 878, "original_id": 1185061, "dataset_name": "refcoco", "area": 24532.900700000002, "iscrowd": 0, "image_id": 878, "category_id": 33, "bbox_list": [ [ 322.98, 0.53, 472.09000000000003, 202.78 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000578009.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: closed suitcase handle top right.", "normal_caption": "closed suitcase handle top right", "solution": [ 322.98, 0.53, 473.09, 203.78 ], "normalized_solution": [ 645, 1, 946, 454 ] }, { "height": 474, "width": 640, "id": 879, "original_id": 1745040, "dataset_name": "refcoco", "area": 10621.392100000001, "iscrowd": 0, "image_id": 879, "category_id": 1, "bbox_list": [ [ 474.0, 221.16, 639.0, 436.03999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577953.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: catcher.", "normal_caption": "catcher", "solution": [ 474.0, 221.16, 640.0, 437.04 ], "normalized_solution": [ 740, 466, 1000, 922 ] }, { "height": 474, "width": 640, "id": 880, "original_id": 1745040, "dataset_name": "refcoco", "area": 10621.392100000001, "iscrowd": 0, "image_id": 880, "category_id": 1, "bbox_list": [ [ 474.0, 221.16, 639.0, 436.03999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577953.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: catcher.", "normal_caption": "catcher", "solution": [ 474.0, 221.16, 640.0, 437.04 ], "normalized_solution": [ 740, 466, 1000, 922 ] }, { "height": 474, "width": 640, "id": 881, "original_id": 1251595, "dataset_name": "refcoco", "area": 37837.09744999999, "iscrowd": 0, "image_id": 881, "category_id": 1, "bbox_list": [ [ 185.34, 113.97, 481.52, 463.40999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577953.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: batter.", "normal_caption": "batter", "solution": [ 185.34, 113.97, 482.52, 464.41 ], "normalized_solution": [ 289, 240, 753, 979 ] }, { "height": 474, "width": 640, "id": 882, "original_id": 1251595, "dataset_name": "refcoco", "area": 37837.09744999999, "iscrowd": 0, "image_id": 882, "category_id": 1, "bbox_list": [ [ 185.34, 113.97, 481.52, 463.40999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577953.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: batter.", "normal_caption": "batter", "solution": [ 185.34, 113.97, 482.52, 464.41 ], "normalized_solution": [ 289, 240, 753, 979 ] }, { "height": 474, "width": 640, "id": 883, "original_id": 1251595, "dataset_name": "refcoco", "area": 37837.09744999999, "iscrowd": 0, "image_id": 883, "category_id": 1, "bbox_list": [ [ 185.34, 113.97, 481.52, 463.40999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577953.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: batter.", "normal_caption": "batter", "solution": [ 185.34, 113.97, 482.52, 464.41 ], "normalized_solution": [ 289, 240, 753, 979 ] }, { "height": 429, "width": 640, "id": 884, "original_id": 1058466, "dataset_name": "refcoco", "area": 18784.425400000004, "iscrowd": 0, "image_id": 884, "category_id": 56, "bbox_list": [ [ 363.29, 205.41, 639.0, 297.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577948.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccoli in focus right.", "normal_caption": "broccoli in focus right", "solution": [ 363.29, 205.41, 640.0, 298.21 ], "normalized_solution": [ 567, 478, 1000, 695 ] }, { "height": 429, "width": 640, "id": 885, "original_id": 1058466, "dataset_name": "refcoco", "area": 18784.425400000004, "iscrowd": 0, "image_id": 885, "category_id": 56, "bbox_list": [ [ 363.29, 205.41, 639.0, 297.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577948.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broc laying sideways next to the chicken fun game have a good one.", "normal_caption": "broc laying sideways next to the chicken fun game have a good one", "solution": [ 363.29, 205.41, 640.0, 298.21 ], "normalized_solution": [ 567, 478, 1000, 695 ] }, { "height": 429, "width": 640, "id": 886, "original_id": 1058466, "dataset_name": "refcoco", "area": 18784.425400000004, "iscrowd": 0, "image_id": 886, "category_id": 56, "bbox_list": [ [ 363.29, 205.41, 639.0, 297.21 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577948.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: broccoli on its side toward the front.", "normal_caption": "broccoli on its side toward the front", "solution": [ 363.29, 205.41, 640.0, 298.21 ], "normalized_solution": [ 567, 478, 1000, 695 ] }, { "height": 500, "width": 375, "id": 887, "original_id": 460061, "dataset_name": "refcoco", "area": 13160.127700000005, "iscrowd": 0, "image_id": 887, "category_id": 1, "bbox_list": [ [ 151.69, 157.38, 279.9, 424.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577907.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy on right.", "normal_caption": "guy on right", "solution": [ 151.69, 157.38, 280.9, 425.92 ], "normalized_solution": [ 404, 314, 749, 851 ] }, { "height": 500, "width": 375, "id": 888, "original_id": 460061, "dataset_name": "refcoco", "area": 13160.127700000005, "iscrowd": 0, "image_id": 888, "category_id": 1, "bbox_list": [ [ 151.69, 157.38, 279.9, 424.92 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577907.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy with gray shirt skier.", "normal_caption": "guy with gray shirt skier", "solution": [ 151.69, 157.38, 280.9, 425.92 ], "normalized_solution": [ 404, 314, 749, 851 ] }, { "height": 480, "width": 640, "id": 889, "original_id": 462595, "dataset_name": "refcoco", "area": 10995.355200000004, "iscrowd": 0, "image_id": 889, "category_id": 1, "bbox_list": [ [ 443.9, 246.77, 527.97, 449.15999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: little girl.", "normal_caption": "little girl", "solution": [ 443.9, 246.77, 528.97, 450.16 ], "normalized_solution": [ 693, 514, 826, 937 ] }, { "height": 480, "width": 640, "id": 890, "original_id": 462595, "dataset_name": "refcoco", "area": 10995.355200000004, "iscrowd": 0, "image_id": 890, "category_id": 1, "bbox_list": [ [ 443.9, 246.77, 527.97, 449.15999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: little girl.", "normal_caption": "little girl", "solution": [ 443.9, 246.77, 528.97, 450.16 ], "normalized_solution": [ 693, 514, 826, 937 ] }, { "height": 480, "width": 640, "id": 891, "original_id": 462595, "dataset_name": "refcoco", "area": 10995.355200000004, "iscrowd": 0, "image_id": 891, "category_id": 1, "bbox_list": [ [ 443.9, 246.77, 527.97, 449.15999999999997 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: child in right.", "normal_caption": "child in right", "solution": [ 443.9, 246.77, 528.97, 450.16 ], "normalized_solution": [ 693, 514, 826, 937 ] }, { "height": 480, "width": 640, "id": 892, "original_id": 415358, "dataset_name": "refcoco", "area": 13345.957250000001, "iscrowd": 0, "image_id": 892, "category_id": 67, "bbox_list": [ [ 324.67, 197.21, 578.24, 276.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: table right above girls head.", "normal_caption": "table right above girls head", "solution": [ 324.67, 197.21, 579.24, 277.03 ], "normalized_solution": [ 507, 410, 905, 577 ] }, { "height": 480, "width": 640, "id": 893, "original_id": 415358, "dataset_name": "refcoco", "area": 13345.957250000001, "iscrowd": 0, "image_id": 893, "category_id": 67, "bbox_list": [ [ 324.67, 197.21, 578.24, 276.03 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: tabletop near little kids head.", "normal_caption": "tabletop near little kids head", "solution": [ 324.67, 197.21, 579.24, 277.03 ], "normalized_solution": [ 507, 410, 905, 577 ] }, { "height": 480, "width": 640, "id": 894, "original_id": 412991, "dataset_name": "refcoco", "area": 51538.67319999998, "iscrowd": 0, "image_id": 894, "category_id": 67, "bbox_list": [ [ 2.16, 320.36, 545.88, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: big table near us.", "normal_caption": "big table near us", "solution": [ 2.16, 320.36, 546.88, 473.53 ], "normalized_solution": [ 3, 667, 854, 986 ] }, { "height": 480, "width": 640, "id": 895, "original_id": 412991, "dataset_name": "refcoco", "area": 51538.67319999998, "iscrowd": 0, "image_id": 895, "category_id": 67, "bbox_list": [ [ 2.16, 320.36, 545.88, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: table.", "normal_caption": "table", "solution": [ 2.16, 320.36, 546.88, 473.53 ], "normalized_solution": [ 3, 667, 854, 986 ] }, { "height": 480, "width": 640, "id": 896, "original_id": 412991, "dataset_name": "refcoco", "area": 51538.67319999998, "iscrowd": 0, "image_id": 896, "category_id": 67, "bbox_list": [ [ 2.16, 320.36, 545.88, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom left.", "normal_caption": "bottom left", "solution": [ 2.16, 320.36, 546.88, 473.53 ], "normalized_solution": [ 3, 667, 854, 986 ] }, { "height": 480, "width": 640, "id": 897, "original_id": 2204710, "dataset_name": "refcoco", "area": 17317.4004, "iscrowd": 0, "image_id": 897, "category_id": 1, "bbox_list": [ [ 21.24, 104.46, 139.54, 365.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: looking at us tall.", "normal_caption": "looking at us tall", "solution": [ 21.24, 104.46, 140.54, 366.02 ], "normalized_solution": [ 33, 217, 219, 762 ] }, { "height": 480, "width": 640, "id": 898, "original_id": 2204710, "dataset_name": "refcoco", "area": 17317.4004, "iscrowd": 0, "image_id": 898, "category_id": 1, "bbox_list": [ [ 21.24, 104.46, 139.54, 365.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left lady.", "normal_caption": "left lady", "solution": [ 21.24, 104.46, 140.54, 366.02 ], "normalized_solution": [ 33, 217, 219, 762 ] }, { "height": 480, "width": 640, "id": 899, "original_id": 2204710, "dataset_name": "refcoco", "area": 17317.4004, "iscrowd": 0, "image_id": 899, "category_id": 1, "bbox_list": [ [ 21.24, 104.46, 139.54, 365.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577850.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 21.24, 104.46, 140.54, 366.02 ], "normalized_solution": [ 33, 217, 219, 762 ] }, { "height": 480, "width": 640, "id": 900, "original_id": 1278499, "dataset_name": "refcoco", "area": 19987.719950000002, "iscrowd": 0, "image_id": 900, "category_id": 1, "bbox_list": [ [ 424.99, 237.3, 592.26, 469.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577830.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman on right of picture.", "normal_caption": "woman on right of picture", "solution": [ 424.99, 237.3, 593.26, 470.29 ], "normalized_solution": [ 664, 494, 926, 979 ] }, { "height": 480, "width": 640, "id": 901, "original_id": 1278499, "dataset_name": "refcoco", "area": 19987.719950000002, "iscrowd": 0, "image_id": 901, "category_id": 1, "bbox_list": [ [ 424.99, 237.3, 592.26, 469.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577830.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl on right nearest us.", "normal_caption": "girl on right nearest us", "solution": [ 424.99, 237.3, 593.26, 470.29 ], "normalized_solution": [ 664, 494, 926, 979 ] }, { "height": 480, "width": 640, "id": 902, "original_id": 1278499, "dataset_name": "refcoco", "area": 19987.719950000002, "iscrowd": 0, "image_id": 902, "category_id": 1, "bbox_list": [ [ 424.99, 237.3, 592.26, 469.29 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577830.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right most woman.", "normal_caption": "right most woman", "solution": [ 424.99, 237.3, 593.26, 470.29 ], "normalized_solution": [ 664, 494, 926, 979 ] }, { "height": 480, "width": 640, "id": 903, "original_id": 1254377, "dataset_name": "refcoco", "area": 26215.070000000003, "iscrowd": 0, "image_id": 903, "category_id": 1, "bbox_list": [ [ 51.78, 225.44, 277.28999999999996, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577830.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left woman.", "normal_caption": "left woman", "solution": [ 51.78, 225.44, 278.29, 473.53 ], "normalized_solution": [ 80, 469, 434, 986 ] }, { "height": 480, "width": 640, "id": 904, "original_id": 1254377, "dataset_name": "refcoco", "area": 26215.070000000003, "iscrowd": 0, "image_id": 904, "category_id": 1, "bbox_list": [ [ 51.78, 225.44, 277.28999999999996, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577830.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white shirt left.", "normal_caption": "white shirt left", "solution": [ 51.78, 225.44, 278.29, 473.53 ], "normalized_solution": [ 80, 469, 434, 986 ] }, { "height": 480, "width": 640, "id": 905, "original_id": 1254377, "dataset_name": "refcoco", "area": 26215.070000000003, "iscrowd": 0, "image_id": 905, "category_id": 1, "bbox_list": [ [ 51.78, 225.44, 277.28999999999996, 472.53 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577830.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman in white on left.", "normal_caption": "woman in white on left", "solution": [ 51.78, 225.44, 278.29, 473.53 ], "normalized_solution": [ 80, 469, 434, 986 ] }, { "height": 640, "width": 480, "id": 906, "original_id": 1221971, "dataset_name": "refcoco", "area": 18114.64495, "iscrowd": 0, "image_id": 906, "category_id": 1, "bbox_list": [ [ 365.38, 1.09, 478.34, 243.92000000000002 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577819.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: person behind girl.", "normal_caption": "person behind girl", "solution": [ 365.38, 1.09, 479.34, 244.92 ], "normalized_solution": [ 761, 1, 998, 382 ] }, { "height": 640, "width": 480, "id": 907, "original_id": 1221971, "dataset_name": "refcoco", "area": 18114.64495, "iscrowd": 0, "image_id": 907, "category_id": 1, "bbox_list": [ [ 365.38, 1.09, 478.34, 243.92000000000002 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577819.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: seated person top right no head.", "normal_caption": "seated person top right no head", "solution": [ 365.38, 1.09, 479.34, 244.92 ], "normalized_solution": [ 761, 1, 998, 382 ] }, { "height": 640, "width": 480, "id": 908, "original_id": 1221971, "dataset_name": "refcoco", "area": 18114.64495, "iscrowd": 0, "image_id": 908, "category_id": 1, "bbox_list": [ [ 365.38, 1.09, 478.34, 243.92000000000002 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577819.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: upper right person.", "normal_caption": "upper right person", "solution": [ 365.38, 1.09, 479.34, 244.92 ], "normalized_solution": [ 761, 1, 998, 382 ] }, { "height": 640, "width": 480, "id": 909, "original_id": 455712, "dataset_name": "refcoco", "area": 160003.00319999995, "iscrowd": 0, "image_id": 909, "category_id": 1, "bbox_list": [ [ 27.2, 40.23, 475.78, 609.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577819.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 27.2, 40.23, 476.78, 610.07 ], "normalized_solution": [ 56, 62, 993, 953 ] }, { "height": 640, "width": 480, "id": 910, "original_id": 455712, "dataset_name": "refcoco", "area": 160003.00319999995, "iscrowd": 0, "image_id": 910, "category_id": 1, "bbox_list": [ [ 27.2, 40.23, 475.78, 609.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577819.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 27.2, 40.23, 476.78, 610.07 ], "normalized_solution": [ 56, 62, 993, 953 ] }, { "height": 640, "width": 480, "id": 911, "original_id": 455712, "dataset_name": "refcoco", "area": 160003.00319999995, "iscrowd": 0, "image_id": 911, "category_id": 1, "bbox_list": [ [ 27.2, 40.23, 475.78, 609.07 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577819.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl.", "normal_caption": "girl", "solution": [ 27.2, 40.23, 476.78, 610.07 ], "normalized_solution": [ 56, 62, 993, 953 ] }, { "height": 426, "width": 640, "id": 912, "original_id": 1549118, "dataset_name": "refcoco", "area": 16307.229499999998, "iscrowd": 0, "image_id": 912, "category_id": 53, "bbox_list": [ [ 253.83, 195.06, 385.51, 338.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle.", "normal_caption": "middle", "solution": [ 253.83, 195.06, 386.51, 339.96 ], "normalized_solution": [ 396, 457, 603, 798 ] }, { "height": 426, "width": 640, "id": 913, "original_id": 1549118, "dataset_name": "refcoco", "area": 16307.229499999998, "iscrowd": 0, "image_id": 913, "category_id": 53, "bbox_list": [ [ 253.83, 195.06, 385.51, 338.96000000000004 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle apple.", "normal_caption": "middle apple", "solution": [ 253.83, 195.06, 386.51, 339.96 ], "normalized_solution": [ 396, 457, 603, 798 ] }, { "height": 426, "width": 640, "id": 914, "original_id": 1548819, "dataset_name": "refcoco", "area": 18044.937849999995, "iscrowd": 0, "image_id": 914, "category_id": 53, "bbox_list": [ [ 430.17, 186.06, 578.22, 342.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: apple on the right.", "normal_caption": "apple on the right", "solution": [ 430.17, 186.06, 579.22, 343.32 ], "normalized_solution": [ 672, 436, 905, 805 ] }, { "height": 426, "width": 640, "id": 915, "original_id": 1548819, "dataset_name": "refcoco", "area": 18044.937849999995, "iscrowd": 0, "image_id": 915, "category_id": 53, "bbox_list": [ [ 430.17, 186.06, 578.22, 342.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: apple on far right.", "normal_caption": "apple on far right", "solution": [ 430.17, 186.06, 579.22, 343.32 ], "normalized_solution": [ 672, 436, 905, 805 ] }, { "height": 426, "width": 640, "id": 916, "original_id": 1548819, "dataset_name": "refcoco", "area": 18044.937849999995, "iscrowd": 0, "image_id": 916, "category_id": 53, "bbox_list": [ [ 430.17, 186.06, 578.22, 342.32 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right apple.", "normal_caption": "right apple", "solution": [ 430.17, 186.06, 579.22, 343.32 ], "normalized_solution": [ 672, 436, 905, 805 ] }, { "height": 426, "width": 640, "id": 917, "original_id": 1047794, "dataset_name": "refcoco", "area": 14968.431800000002, "iscrowd": 0, "image_id": 917, "category_id": 53, "bbox_list": [ [ 93.22, 201.47, 225.53, 333.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: leftmost apple.", "normal_caption": "leftmost apple", "solution": [ 93.22, 201.47, 226.53, 334.79 ], "normalized_solution": [ 145, 472, 353, 785 ] }, { "height": 426, "width": 640, "id": 918, "original_id": 1047794, "dataset_name": "refcoco", "area": 14968.431800000002, "iscrowd": 0, "image_id": 918, "category_id": 53, "bbox_list": [ [ 93.22, 201.47, 225.53, 333.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: apple on left.", "normal_caption": "apple on left", "solution": [ 93.22, 201.47, 226.53, 334.79 ], "normalized_solution": [ 145, 472, 353, 785 ] }, { "height": 426, "width": 640, "id": 919, "original_id": 1047794, "dataset_name": "refcoco", "area": 14968.431800000002, "iscrowd": 0, "image_id": 919, "category_id": 53, "bbox_list": [ [ 93.22, 201.47, 225.53, 333.78999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577809.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: apple on left.", "normal_caption": "apple on left", "solution": [ 93.22, 201.47, 226.53, 334.79 ], "normalized_solution": [ 145, 472, 353, 785 ] }, { "height": 612, "width": 612, "id": 920, "original_id": 311291, "dataset_name": "refcoco", "area": 40685.93230000001, "iscrowd": 0, "image_id": 920, "category_id": 54, "bbox_list": [ [ 275.81, 85.08, 586.3, 384.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577808.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right half of sandwhich.", "normal_caption": "right half of sandwhich", "solution": [ 275.81, 85.08, 587.3, 385.59 ], "normalized_solution": [ 450, 139, 959, 630 ] }, { "height": 612, "width": 612, "id": 921, "original_id": 311291, "dataset_name": "refcoco", "area": 40685.93230000001, "iscrowd": 0, "image_id": 921, "category_id": 54, "bbox_list": [ [ 275.81, 85.08, 586.3, 384.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577808.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right sandwhich.", "normal_caption": "right sandwhich", "solution": [ 275.81, 85.08, 587.3, 385.59 ], "normalized_solution": [ 450, 139, 959, 630 ] }, { "height": 612, "width": 612, "id": 922, "original_id": 311291, "dataset_name": "refcoco", "area": 40685.93230000001, "iscrowd": 0, "image_id": 922, "category_id": 54, "bbox_list": [ [ 275.81, 85.08, 586.3, 384.59 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577808.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right sandwich.", "normal_caption": "right sandwich", "solution": [ 275.81, 85.08, 587.3, 385.59 ], "normalized_solution": [ 450, 139, 959, 630 ] }, { "height": 612, "width": 612, "id": 923, "original_id": 310638, "dataset_name": "refcoco", "area": 64472.061050000004, "iscrowd": 0, "image_id": 923, "category_id": 54, "bbox_list": [ [ 24.76, 48.23, 458.34, 322.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577808.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left sandwich piece.", "normal_caption": "left sandwich piece", "solution": [ 24.76, 48.23, 459.34, 323.28 ], "normalized_solution": [ 40, 78, 750, 528 ] }, { "height": 612, "width": 612, "id": 924, "original_id": 310638, "dataset_name": "refcoco", "area": 64472.061050000004, "iscrowd": 0, "image_id": 924, "category_id": 54, "bbox_list": [ [ 24.76, 48.23, 458.34, 322.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577808.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top slicd.", "normal_caption": "top slicd", "solution": [ 24.76, 48.23, 459.34, 323.28 ], "normalized_solution": [ 40, 78, 750, 528 ] }, { "height": 612, "width": 612, "id": 925, "original_id": 310638, "dataset_name": "refcoco", "area": 64472.061050000004, "iscrowd": 0, "image_id": 925, "category_id": 54, "bbox_list": [ [ 24.76, 48.23, 458.34, 322.28000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577808.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top sandwich also left.", "normal_caption": "top sandwich also left", "solution": [ 24.76, 48.23, 459.34, 323.28 ], "normalized_solution": [ 40, 78, 750, 528 ] }, { "height": 640, "width": 536, "id": 926, "original_id": 1876330, "dataset_name": "refcoco", "area": 24701.384200000004, "iscrowd": 0, "image_id": 926, "category_id": 46, "bbox_list": [ [ 349.17, 36.02, 532.46, 407.60999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: last wine glass toward back.", "normal_caption": "last wine glass toward back", "solution": [ 349.17, 36.02, 533.46, 408.61 ], "normalized_solution": [ 651, 56, 995, 638 ] }, { "height": 640, "width": 536, "id": 927, "original_id": 1876330, "dataset_name": "refcoco", "area": 24701.384200000004, "iscrowd": 0, "image_id": 927, "category_id": 46, "bbox_list": [ [ 349.17, 36.02, 532.46, 407.60999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: empty wine glass.", "normal_caption": "empty wine glass", "solution": [ 349.17, 36.02, 533.46, 408.61 ], "normalized_solution": [ 651, 56, 995, 638 ] }, { "height": 640, "width": 536, "id": 928, "original_id": 1876232, "dataset_name": "refcoco", "area": 23829.947150000007, "iscrowd": 0, "image_id": 928, "category_id": 46, "bbox_list": [ [ 276.7, 51.08, 465.42999999999995, 448.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: third glass from back.", "normal_caption": "third glass from back", "solution": [ 276.7, 51.08, 466.43, 449.2 ], "normalized_solution": [ 516, 79, 870, 701 ] }, { "height": 640, "width": 536, "id": 929, "original_id": 1876232, "dataset_name": "refcoco", "area": 23829.947150000007, "iscrowd": 0, "image_id": 929, "category_id": 46, "bbox_list": [ [ 276.7, 51.08, 465.42999999999995, 448.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: glass second from the right.", "normal_caption": "glass second from the right", "solution": [ 276.7, 51.08, 466.43, 449.2 ], "normalized_solution": [ 516, 79, 870, 701 ] }, { "height": 640, "width": 536, "id": 930, "original_id": 1876232, "dataset_name": "refcoco", "area": 23829.947150000007, "iscrowd": 0, "image_id": 930, "category_id": 46, "bbox_list": [ [ 276.7, 51.08, 465.42999999999995, 448.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second glass from the right.", "normal_caption": "second glass from the right", "solution": [ 276.7, 51.08, 466.43, 449.2 ], "normalized_solution": [ 516, 79, 870, 701 ] }, { "height": 640, "width": 536, "id": 931, "original_id": 1874521, "dataset_name": "refcoco", "area": 24461.733150000007, "iscrowd": 0, "image_id": 931, "category_id": 46, "bbox_list": [ [ 183.37, 61.37, 374.74, 489.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: class in middle top.", "normal_caption": "class in middle top", "solution": [ 183.37, 61.37, 375.74, 490.25 ], "normalized_solution": [ 342, 95, 701, 766 ] }, { "height": 640, "width": 536, "id": 932, "original_id": 1874521, "dataset_name": "refcoco", "area": 24461.733150000007, "iscrowd": 0, "image_id": 932, "category_id": 46, "bbox_list": [ [ 183.37, 61.37, 374.74, 489.25 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle glass.", "normal_caption": "middle glass", "solution": [ 183.37, 61.37, 375.74, 490.25 ], "normalized_solution": [ 342, 95, 701, 766 ] }, { "height": 640, "width": 536, "id": 933, "original_id": 1498181, "dataset_name": "refcoco", "area": 17953.012399999996, "iscrowd": 0, "image_id": 933, "category_id": 46, "bbox_list": [ [ 97.06, 49.54, 289.1, 578.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: edge of glass third from left.", "normal_caption": "edge of glass third from left", "solution": [ 97.06, 49.54, 290.1, 579.51 ], "normalized_solution": [ 181, 77, 541, 905 ] }, { "height": 640, "width": 536, "id": 934, "original_id": 1498181, "dataset_name": "refcoco", "area": 17953.012399999996, "iscrowd": 0, "image_id": 934, "category_id": 46, "bbox_list": [ [ 97.06, 49.54, 289.1, 578.51 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: third in from left look at the stems of the cup.", "normal_caption": "third in from left look at the stems of the cup", "solution": [ 97.06, 49.54, 290.1, 579.51 ], "normalized_solution": [ 181, 77, 541, 905 ] }, { "height": 640, "width": 536, "id": 935, "original_id": 1497046, "dataset_name": "refcoco", "area": 40743.10730000001, "iscrowd": 0, "image_id": 935, "category_id": 46, "bbox_list": [ [ 46.68, 82.57, 285.12, 631.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second glass from front.", "normal_caption": "second glass from front", "solution": [ 46.68, 82.57, 286.12, 632.22 ], "normalized_solution": [ 87, 129, 533, 987 ] }, { "height": 640, "width": 536, "id": 936, "original_id": 1497046, "dataset_name": "refcoco", "area": 40743.10730000001, "iscrowd": 0, "image_id": 936, "category_id": 46, "bbox_list": [ [ 46.68, 82.57, 285.12, 631.22 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: second from left glass.", "normal_caption": "second from left glass", "solution": [ 46.68, 82.57, 286.12, 632.22 ], "normalized_solution": [ 87, 129, 533, 987 ] }, { "height": 640, "width": 536, "id": 937, "original_id": 1496371, "dataset_name": "refcoco", "area": 29269.47925, "iscrowd": 0, "image_id": 937, "category_id": 46, "bbox_list": [ [ 1.51, 35.89, 98.39, 479.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: glass left.", "normal_caption": "glass left", "solution": [ 1.51, 35.89, 99.39, 480.13 ], "normalized_solution": [ 2, 56, 185, 750 ] }, { "height": 640, "width": 536, "id": 938, "original_id": 1496371, "dataset_name": "refcoco", "area": 29269.47925, "iscrowd": 0, "image_id": 938, "category_id": 46, "bbox_list": [ [ 1.51, 35.89, 98.39, 479.13 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577657.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: first glass left.", "normal_caption": "first glass left", "solution": [ 1.51, 35.89, 99.39, 480.13 ], "normalized_solution": [ 2, 56, 185, 750 ] }, { "height": 480, "width": 640, "id": 939, "original_id": 492827, "dataset_name": "refcoco", "area": 50319.1093, "iscrowd": 0, "image_id": 939, "category_id": 1, "bbox_list": [ [ 143.46, 225.44, 485.47, 470.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577637.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man with white watch looking at phone.", "normal_caption": "man with white watch looking at phone", "solution": [ 143.46, 225.44, 486.47, 471.37 ], "normalized_solution": [ 224, 469, 760, 982 ] }, { "height": 480, "width": 640, "id": 940, "original_id": 492827, "dataset_name": "refcoco", "area": 50319.1093, "iscrowd": 0, "image_id": 940, "category_id": 1, "bbox_list": [ [ 143.46, 225.44, 485.47, 470.37 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577637.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle guy.", "normal_caption": "middle guy", "solution": [ 143.46, 225.44, 486.47, 471.37 ], "normalized_solution": [ 224, 469, 760, 982 ] }, { "height": 480, "width": 640, "id": 941, "original_id": 441450, "dataset_name": "refcoco", "area": 25694.69305, "iscrowd": 0, "image_id": 941, "category_id": 1, "bbox_list": [ [ 516.87, 154.28, 639.0, 478.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577637.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right guy.", "normal_caption": "right guy", "solution": [ 516.87, 154.28, 640.0, 479.02 ], "normalized_solution": [ 807, 321, 1000, 997 ] }, { "height": 480, "width": 640, "id": 942, "original_id": 441450, "dataset_name": "refcoco", "area": 25694.69305, "iscrowd": 0, "image_id": 942, "category_id": 1, "bbox_list": [ [ 516.87, 154.28, 639.0, 478.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577637.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: guy right.", "normal_caption": "guy right", "solution": [ 516.87, 154.28, 640.0, 479.02 ], "normalized_solution": [ 807, 321, 1000, 997 ] }, { "height": 504, "width": 640, "id": 943, "original_id": 486090, "dataset_name": "refcoco", "area": 25209.967249999998, "iscrowd": 0, "image_id": 943, "category_id": 1, "bbox_list": [ [ 306.98, 32.41, 450.70000000000005, 457.28999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink girl.", "normal_caption": "pink girl", "solution": [ 306.98, 32.41, 451.7, 458.29 ], "normalized_solution": [ 479, 64, 705, 909 ] }, { "height": 504, "width": 640, "id": 944, "original_id": 486090, "dataset_name": "refcoco", "area": 25209.967249999998, "iscrowd": 0, "image_id": 944, "category_id": 1, "bbox_list": [ [ 306.98, 32.41, 450.70000000000005, 457.28999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink.", "normal_caption": "pink", "solution": [ 306.98, 32.41, 451.7, 458.29 ], "normalized_solution": [ 479, 64, 705, 909 ] }, { "height": 504, "width": 640, "id": 945, "original_id": 486090, "dataset_name": "refcoco", "area": 25209.967249999998, "iscrowd": 0, "image_id": 945, "category_id": 1, "bbox_list": [ [ 306.98, 32.41, 450.70000000000005, 457.28999999999996 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: pink.", "normal_caption": "pink", "solution": [ 306.98, 32.41, 451.7, 458.29 ], "normalized_solution": [ 479, 64, 705, 909 ] }, { "height": 504, "width": 640, "id": 946, "original_id": 474480, "dataset_name": "refcoco", "area": 31877.49419999999, "iscrowd": 0, "image_id": 946, "category_id": 1, "bbox_list": [ [ 244.53, 45.39, 370.97, 458.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 244.53, 45.39, 371.97, 459.38 ], "normalized_solution": [ 382, 90, 581, 911 ] }, { "height": 504, "width": 640, "id": 947, "original_id": 474480, "dataset_name": "refcoco", "area": 31877.49419999999, "iscrowd": 0, "image_id": 947, "category_id": 1, "bbox_list": [ [ 244.53, 45.39, 370.97, 458.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 244.53, 45.39, 371.97, 459.38 ], "normalized_solution": [ 382, 90, 581, 911 ] }, { "height": 504, "width": 640, "id": 948, "original_id": 474480, "dataset_name": "refcoco", "area": 31877.49419999999, "iscrowd": 0, "image_id": 948, "category_id": 1, "bbox_list": [ [ 244.53, 45.39, 370.97, 458.38 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the man in the middle.", "normal_caption": "the man in the middle", "solution": [ 244.53, 45.39, 371.97, 459.38 ], "normalized_solution": [ 382, 90, 581, 911 ] }, { "height": 504, "width": 640, "id": 949, "original_id": 438914, "dataset_name": "refcoco", "area": 30508.647100000002, "iscrowd": 0, "image_id": 949, "category_id": 1, "bbox_list": [ [ 143.03, 41.43, 264.62, 447.95 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: blue dress left.", "normal_caption": "blue dress left", "solution": [ 143.03, 41.43, 265.62, 448.95 ], "normalized_solution": [ 223, 82, 415, 890 ] }, { "height": 504, "width": 640, "id": 950, "original_id": 438914, "dataset_name": "refcoco", "area": 30508.647100000002, "iscrowd": 0, "image_id": 950, "category_id": 1, "bbox_list": [ [ 143.03, 41.43, 264.62, 447.95 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the woman to the left.", "normal_caption": "the woman to the left", "solution": [ 143.03, 41.43, 265.62, 448.95 ], "normalized_solution": [ 223, 82, 415, 890 ] }, { "height": 504, "width": 640, "id": 951, "original_id": 438914, "dataset_name": "refcoco", "area": 30508.647100000002, "iscrowd": 0, "image_id": 951, "category_id": 1, "bbox_list": [ [ 143.03, 41.43, 264.62, 447.95 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577586.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: girl on left.", "normal_caption": "girl on left", "solution": [ 143.03, 41.43, 265.62, 448.95 ], "normalized_solution": [ 223, 82, 415, 890 ] }, { "height": 640, "width": 544, "id": 952, "original_id": 197375, "dataset_name": "refcoco", "area": 107469.06749999998, "iscrowd": 0, "image_id": 952, "category_id": 1, "bbox_list": [ [ 194.3, 18.91, 479.45, 590.23 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577556.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the guy.", "normal_caption": "the guy", "solution": [ 194.3, 18.91, 480.45, 591.23 ], "normalized_solution": [ 357, 29, 883, 923 ] }, { "height": 640, "width": 544, "id": 953, "original_id": 197375, "dataset_name": "refcoco", "area": 107469.06749999998, "iscrowd": 0, "image_id": 953, "category_id": 1, "bbox_list": [ [ 194.3, 18.91, 479.45, 590.23 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577556.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: man.", "normal_caption": "man", "solution": [ 194.3, 18.91, 480.45, 591.23 ], "normalized_solution": [ 357, 29, 883, 923 ] }, { "height": 640, "width": 544, "id": 954, "original_id": 197375, "dataset_name": "refcoco", "area": 107469.06749999998, "iscrowd": 0, "image_id": 954, "category_id": 1, "bbox_list": [ [ 194.3, 18.91, 479.45, 590.23 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577556.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: groom.", "normal_caption": "groom", "solution": [ 194.3, 18.91, 480.45, 591.23 ], "normalized_solution": [ 357, 29, 883, 923 ] }, { "height": 640, "width": 544, "id": 955, "original_id": 194366, "dataset_name": "refcoco", "area": 96465.63625000001, "iscrowd": 0, "image_id": 955, "category_id": 1, "bbox_list": [ [ 11.51, 66.16, 247.81, 631.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577556.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bride.", "normal_caption": "bride", "solution": [ 11.51, 66.16, 248.81, 632.81 ], "normalized_solution": [ 21, 103, 457, 988 ] }, { "height": 640, "width": 544, "id": 956, "original_id": 194366, "dataset_name": "refcoco", "area": 96465.63625000001, "iscrowd": 0, "image_id": 956, "category_id": 1, "bbox_list": [ [ 11.51, 66.16, 247.81, 631.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577556.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: women.", "normal_caption": "women", "solution": [ 11.51, 66.16, 248.81, 632.81 ], "normalized_solution": [ 21, 103, 457, 988 ] }, { "height": 640, "width": 544, "id": 957, "original_id": 194366, "dataset_name": "refcoco", "area": 96465.63625000001, "iscrowd": 0, "image_id": 957, "category_id": 1, "bbox_list": [ [ 11.51, 66.16, 247.81, 631.81 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577556.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: woman.", "normal_caption": "woman", "solution": [ 11.51, 66.16, 248.81, 632.81 ], "normalized_solution": [ 21, 103, 457, 988 ] }, { "height": 429, "width": 640, "id": 958, "original_id": 44179, "dataset_name": "refcoco", "area": 36802.91265000001, "iscrowd": 0, "image_id": 958, "category_id": 16, "bbox_list": [ [ 338.59, 187.28, 639.0, 423.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: closest to us of 3 birds right.", "normal_caption": "closest to us of 3 birds right", "solution": [ 338.59, 187.28, 640.0, 424.39 ], "normalized_solution": [ 529, 436, 1000, 989 ] }, { "height": 429, "width": 640, "id": 959, "original_id": 44179, "dataset_name": "refcoco", "area": 36802.91265000001, "iscrowd": 0, "image_id": 959, "category_id": 16, "bbox_list": [ [ 338.59, 187.28, 639.0, 423.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bird closest to camera.", "normal_caption": "bird closest to camera", "solution": [ 338.59, 187.28, 640.0, 424.39 ], "normalized_solution": [ 529, 436, 1000, 989 ] }, { "height": 429, "width": 640, "id": 960, "original_id": 44179, "dataset_name": "refcoco", "area": 36802.91265000001, "iscrowd": 0, "image_id": 960, "category_id": 16, "bbox_list": [ [ 338.59, 187.28, 639.0, 423.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bottom right bird.", "normal_caption": "bottom right bird", "solution": [ 338.59, 187.28, 640.0, 424.39 ], "normalized_solution": [ 529, 436, 1000, 989 ] }, { "height": 429, "width": 640, "id": 961, "original_id": 42629, "dataset_name": "refcoco", "area": 18793.17655, "iscrowd": 0, "image_id": 961, "category_id": 16, "bbox_list": [ [ 475.13, 54.15, 639.0, 293.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: bird farthest to the right.", "normal_caption": "bird farthest to the right", "solution": [ 475.13, 54.15, 640.0, 294.02 ], "normalized_solution": [ 742, 126, 1000, 685 ] }, { "height": 429, "width": 640, "id": 962, "original_id": 42629, "dataset_name": "refcoco", "area": 18793.17655, "iscrowd": 0, "image_id": 962, "category_id": 16, "bbox_list": [ [ 475.13, 54.15, 639.0, 293.02 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right bird.", "normal_caption": "far right bird", "solution": [ 475.13, 54.15, 640.0, 294.02 ], "normalized_solution": [ 742, 126, 1000, 685 ] }, { "height": 429, "width": 640, "id": 963, "original_id": 40243, "dataset_name": "refcoco", "area": 22666.28625, "iscrowd": 0, "image_id": 963, "category_id": 16, "bbox_list": [ [ 0.0, 167.81, 239.39, 414.59000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: leftmost and black bird.", "normal_caption": "leftmost and black bird", "solution": [ 0.0, 167.81, 240.39, 415.59 ], "normalized_solution": [ 0, 391, 375, 968 ] }, { "height": 429, "width": 640, "id": 964, "original_id": 40243, "dataset_name": "refcoco", "area": 22666.28625, "iscrowd": 0, "image_id": 964, "category_id": 16, "bbox_list": [ [ 0.0, 167.81, 239.39, 414.59000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: black bird to left.", "normal_caption": "black bird to left", "solution": [ 0.0, 167.81, 240.39, 415.59 ], "normalized_solution": [ 0, 391, 375, 968 ] }, { "height": 429, "width": 640, "id": 965, "original_id": 40243, "dataset_name": "refcoco", "area": 22666.28625, "iscrowd": 0, "image_id": 965, "category_id": 16, "bbox_list": [ [ 0.0, 167.81, 239.39, 414.59000000000003 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: all black bird left side.", "normal_caption": "all black bird left side", "solution": [ 0.0, 167.81, 240.39, 415.59 ], "normalized_solution": [ 0, 391, 375, 968 ] }, { "height": 429, "width": 640, "id": 966, "original_id": 36395, "dataset_name": "refcoco", "area": 14635.511000000004, "iscrowd": 0, "image_id": 966, "category_id": 16, "bbox_list": [ [ 346.89, 106.1, 590.37, 280.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: top bird second from right.", "normal_caption": "top bird second from right", "solution": [ 346.89, 106.1, 591.37, 281.39 ], "normalized_solution": [ 542, 247, 924, 655 ] }, { "height": 429, "width": 640, "id": 967, "original_id": 36395, "dataset_name": "refcoco", "area": 14635.511000000004, "iscrowd": 0, "image_id": 967, "category_id": 16, "bbox_list": [ [ 346.89, 106.1, 590.37, 280.39 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577455.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: middle bird in the group of 3.", "normal_caption": "middle bird in the group of 3", "solution": [ 346.89, 106.1, 591.37, 281.39 ], "normalized_solution": [ 542, 247, 924, 655 ] }, { "height": 375, "width": 500, "id": 968, "original_id": 1053804, "dataset_name": "refcoco", "area": 36596.324700000005, "iscrowd": 0, "image_id": 968, "category_id": 55, "bbox_list": [ [ 290.29, 65.29, 499.0, 366.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577447.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: fruit on bottom right.", "normal_caption": "fruit on bottom right", "solution": [ 290.29, 65.29, 500.0, 367.06 ], "normalized_solution": [ 580, 174, 1000, 978 ] }, { "height": 375, "width": 500, "id": 969, "original_id": 1053804, "dataset_name": "refcoco", "area": 36596.324700000005, "iscrowd": 0, "image_id": 969, "category_id": 55, "bbox_list": [ [ 290.29, 65.29, 499.0, 366.06 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577447.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: front right bowl small orangey fruit.", "normal_caption": "front right bowl small orangey fruit", "solution": [ 290.29, 65.29, 500.0, 367.06 ], "normalized_solution": [ 580, 174, 1000, 978 ] }, { "height": 375, "width": 500, "id": 970, "original_id": 1052973, "dataset_name": "refcoco", "area": 10353.9623, "iscrowd": 0, "image_id": 970, "category_id": 55, "bbox_list": [ [ 0.0, 75.7, 118.72, 190.9 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577447.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange in bowl on left sticking over side.", "normal_caption": "orange in bowl on left sticking over side", "solution": [ 0.0, 75.7, 119.72, 191.9 ], "normalized_solution": [ 0, 201, 239, 511 ] }, { "height": 375, "width": 500, "id": 971, "original_id": 1052973, "dataset_name": "refcoco", "area": 10353.9623, "iscrowd": 0, "image_id": 971, "category_id": 55, "bbox_list": [ [ 0.0, 75.7, 118.72, 190.9 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577447.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the orange to the far left left orangeleft bowl.", "normal_caption": "the orange to the far left left orangeleft bowl", "solution": [ 0.0, 75.7, 119.72, 191.9 ], "normalized_solution": [ 0, 201, 239, 511 ] }, { "height": 375, "width": 500, "id": 972, "original_id": 1052973, "dataset_name": "refcoco", "area": 10353.9623, "iscrowd": 0, "image_id": 972, "category_id": 55, "bbox_list": [ [ 0.0, 75.7, 118.72, 190.9 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577447.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: left bowl leftmost orange.", "normal_caption": "left bowl leftmost orange", "solution": [ 0.0, 75.7, 119.72, 191.9 ], "normalized_solution": [ 0, 201, 239, 511 ] }, { "height": 480, "width": 640, "id": 973, "original_id": 60287, "dataset_name": "refcoco", "area": 24364.93689999998, "iscrowd": 0, "image_id": 973, "category_id": 19, "bbox_list": [ [ 279.84, 164.12, 551.31, 390.67 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577421.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse on the right.", "normal_caption": "horse on the right", "solution": [ 279.84, 164.12, 552.31, 391.67 ], "normalized_solution": [ 437, 341, 862, 815 ] }, { "height": 480, "width": 640, "id": 974, "original_id": 60287, "dataset_name": "refcoco", "area": 24364.93689999998, "iscrowd": 0, "image_id": 974, "category_id": 19, "bbox_list": [ [ 279.84, 164.12, 551.31, 390.67 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577421.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right horse only the horse.", "normal_caption": "right horse only the horse", "solution": [ 279.84, 164.12, 552.31, 391.67 ], "normalized_solution": [ 437, 341, 862, 815 ] }, { "height": 480, "width": 640, "id": 975, "original_id": 60287, "dataset_name": "refcoco", "area": 24364.93689999998, "iscrowd": 0, "image_id": 975, "category_id": 19, "bbox_list": [ [ 279.84, 164.12, 551.31, 390.67 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577421.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right horse.", "normal_caption": "right horse", "solution": [ 279.84, 164.12, 552.31, 391.67 ], "normalized_solution": [ 437, 341, 862, 815 ] }, { "height": 480, "width": 640, "id": 976, "original_id": 56169, "dataset_name": "refcoco", "area": 15435.184499999998, "iscrowd": 0, "image_id": 976, "category_id": 19, "bbox_list": [ [ 169.75, 147.53, 342.53999999999996, 343.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577421.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse racing on the left.", "normal_caption": "horse racing on the left", "solution": [ 169.75, 147.53, 343.54, 344.0 ], "normalized_solution": [ 265, 307, 536, 716 ] }, { "height": 480, "width": 640, "id": 977, "original_id": 56169, "dataset_name": "refcoco", "area": 15435.184499999998, "iscrowd": 0, "image_id": 977, "category_id": 19, "bbox_list": [ [ 169.75, 147.53, 342.53999999999996, 343.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577421.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse on left.", "normal_caption": "horse on left", "solution": [ 169.75, 147.53, 343.54, 344.0 ], "normalized_solution": [ 265, 307, 536, 716 ] }, { "height": 480, "width": 640, "id": 978, "original_id": 1709252, "dataset_name": "refcoco", "area": 76398.28319999999, "iscrowd": 0, "image_id": 978, "category_id": 1, "bbox_list": [ [ 0.0, 195.24, 534.01, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577416.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: creepy arm.", "normal_caption": "creepy arm", "solution": [ 0.0, 195.24, 535.01, 480.0 ], "normalized_solution": [ 0, 406, 835, 1000 ] }, { "height": 480, "width": 640, "id": 979, "original_id": 1709252, "dataset_name": "refcoco", "area": 76398.28319999999, "iscrowd": 0, "image_id": 979, "category_id": 1, "bbox_list": [ [ 0.0, 195.24, 534.01, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577416.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: persons arm.", "normal_caption": "persons arm", "solution": [ 0.0, 195.24, 535.01, 480.0 ], "normalized_solution": [ 0, 406, 835, 1000 ] }, { "height": 480, "width": 640, "id": 980, "original_id": 1709252, "dataset_name": "refcoco", "area": 76398.28319999999, "iscrowd": 0, "image_id": 980, "category_id": 1, "bbox_list": [ [ 0.0, 195.24, 534.01, 479.0 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577416.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: hand on the blender.", "normal_caption": "hand on the blender", "solution": [ 0.0, 195.24, 535.01, 480.0 ], "normalized_solution": [ 0, 406, 835, 1000 ] }, { "height": 480, "width": 640, "id": 981, "original_id": 1053665, "dataset_name": "refcoco", "area": 14196.564, "iscrowd": 0, "image_id": 981, "category_id": 55, "bbox_list": [ [ 81.04, 199.01, 220.12, 361.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577405.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange in middle on the left.", "normal_caption": "orange in middle on the left", "solution": [ 81.04, 199.01, 221.12, 362.2 ], "normalized_solution": [ 126, 414, 345, 754 ] }, { "height": 480, "width": 640, "id": 982, "original_id": 1053665, "dataset_name": "refcoco", "area": 14196.564, "iscrowd": 0, "image_id": 982, "category_id": 55, "bbox_list": [ [ 81.04, 199.01, 220.12, 361.2 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577405.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: partial orange second from bottom on left.", "normal_caption": "partial orange second from bottom on left", "solution": [ 81.04, 199.01, 221.12, 362.2 ], "normalized_solution": [ 126, 414, 345, 754 ] }, { "height": 480, "width": 640, "id": 983, "original_id": 1050997, "dataset_name": "refcoco", "area": 28126.108900000007, "iscrowd": 0, "image_id": 983, "category_id": 55, "bbox_list": [ [ 166.02, 215.72, 363.8, 396.55 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577405.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange in front.", "normal_caption": "orange in front", "solution": [ 166.02, 215.72, 364.8, 397.55 ], "normalized_solution": [ 259, 449, 570, 828 ] }, { "height": 480, "width": 640, "id": 984, "original_id": 1050997, "dataset_name": "refcoco", "area": 28126.108900000007, "iscrowd": 0, "image_id": 984, "category_id": 55, "bbox_list": [ [ 166.02, 215.72, 363.8, 396.55 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577405.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange bottom front.", "normal_caption": "orange bottom front", "solution": [ 166.02, 215.72, 364.8, 397.55 ], "normalized_solution": [ 259, 449, 570, 828 ] }, { "height": 480, "width": 640, "id": 985, "original_id": 1050997, "dataset_name": "refcoco", "area": 28126.108900000007, "iscrowd": 0, "image_id": 985, "category_id": 55, "bbox_list": [ [ 166.02, 215.72, 363.8, 396.55 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577405.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: orange closest to you next to apple.", "normal_caption": "orange closest to you next to apple", "solution": [ 166.02, 215.72, 364.8, 397.55 ], "normalized_solution": [ 259, 449, 570, 828 ] }, { "height": 428, "width": 640, "id": 986, "original_id": 59402, "dataset_name": "refcoco", "area": 12654.579749999999, "iscrowd": 0, "image_id": 986, "category_id": 19, "bbox_list": [ [ 174.88, 154.63, 290.78, 415.95 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577362.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse on left.", "normal_caption": "horse on left", "solution": [ 174.88, 154.63, 291.78, 416.95 ], "normalized_solution": [ 273, 361, 455, 974 ] }, { "height": 428, "width": 640, "id": 987, "original_id": 59402, "dataset_name": "refcoco", "area": 12654.579749999999, "iscrowd": 0, "image_id": 987, "category_id": 19, "bbox_list": [ [ 174.88, 154.63, 290.78, 415.95 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577362.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse on left.", "normal_caption": "horse on left", "solution": [ 174.88, 154.63, 291.78, 416.95 ], "normalized_solution": [ 273, 361, 455, 974 ] }, { "height": 428, "width": 640, "id": 988, "original_id": 59402, "dataset_name": "refcoco", "area": 12654.579749999999, "iscrowd": 0, "image_id": 988, "category_id": 19, "bbox_list": [ [ 174.88, 154.63, 290.78, 415.95 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577362.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse left.", "normal_caption": "horse left", "solution": [ 174.88, 154.63, 291.78, 416.95 ], "normalized_solution": [ 273, 361, 455, 974 ] }, { "height": 428, "width": 640, "id": 989, "original_id": 58107, "dataset_name": "refcoco", "area": 12454.57325, "iscrowd": 0, "image_id": 989, "category_id": 19, "bbox_list": [ [ 404.17, 232.0, 515.9, 400.55 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577362.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: horse on right.", "normal_caption": "horse on right", "solution": [ 404.17, 232.0, 516.9, 401.55 ], "normalized_solution": [ 631, 542, 807, 938 ] }, { "height": 428, "width": 640, "id": 990, "original_id": 58107, "dataset_name": "refcoco", "area": 12454.57325, "iscrowd": 0, "image_id": 990, "category_id": 19, "bbox_list": [ [ 404.17, 232.0, 515.9, 400.55 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577362.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: back of right side of horse.", "normal_caption": "back of right side of horse", "solution": [ 404.17, 232.0, 516.9, 401.55 ], "normalized_solution": [ 631, 542, 807, 938 ] }, { "height": 428, "width": 640, "id": 991, "original_id": 58107, "dataset_name": "refcoco", "area": 12454.57325, "iscrowd": 0, "image_id": 991, "category_id": 19, "bbox_list": [ [ 404.17, 232.0, 515.9, 400.55 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577362.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: back of horse.", "normal_caption": "back of horse", "solution": [ 404.17, 232.0, 516.9, 401.55 ], "normalized_solution": [ 631, 542, 807, 938 ] }, { "height": 640, "width": 480, "id": 992, "original_id": 201468, "dataset_name": "refcoco", "area": 10568.67365, "iscrowd": 0, "image_id": 992, "category_id": 1, "bbox_list": [ [ 396.46, 281.59, 479.0, 523.4 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577358.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white coat.", "normal_caption": "white coat", "solution": [ 396.46, 281.59, 480.0, 524.4 ], "normalized_solution": [ 825, 439, 1000, 819 ] }, { "height": 640, "width": 480, "id": 993, "original_id": 201468, "dataset_name": "refcoco", "area": 10568.67365, "iscrowd": 0, "image_id": 993, "category_id": 1, "bbox_list": [ [ 396.46, 281.59, 479.0, 523.4 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577358.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white coat window shopping.", "normal_caption": "white coat window shopping", "solution": [ 396.46, 281.59, 480.0, 524.4 ], "normalized_solution": [ 825, 439, 1000, 819 ] }, { "height": 640, "width": 480, "id": 994, "original_id": 201468, "dataset_name": "refcoco", "area": 10568.67365, "iscrowd": 0, "image_id": 994, "category_id": 1, "bbox_list": [ [ 396.46, 281.59, 479.0, 523.4 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577358.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: white jacket.", "normal_caption": "white jacket", "solution": [ 396.46, 281.59, 480.0, 524.4 ], "normalized_solution": [ 825, 439, 1000, 819 ] }, { "height": 494, "width": 640, "id": 995, "original_id": 165858, "dataset_name": "refcoco", "area": 11651.181999999993, "iscrowd": 0, "image_id": 995, "category_id": 6, "bbox_list": [ [ 533.96, 187.61, 639.0, 346.47 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577343.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: far right bus.", "normal_caption": "far right bus", "solution": [ 533.96, 187.61, 640.0, 347.47 ], "normalized_solution": [ 834, 379, 1000, 703 ] }, { "height": 494, "width": 640, "id": 996, "original_id": 165858, "dataset_name": "refcoco", "area": 11651.181999999993, "iscrowd": 0, "image_id": 996, "category_id": 6, "bbox_list": [ [ 533.96, 187.61, 639.0, 346.47 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577343.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: right red bus.", "normal_caption": "right red bus", "solution": [ 533.96, 187.61, 640.0, 347.47 ], "normalized_solution": [ 834, 379, 1000, 703 ] }, { "height": 494, "width": 640, "id": 997, "original_id": 165858, "dataset_name": "refcoco", "area": 11651.181999999993, "iscrowd": 0, "image_id": 997, "category_id": 6, "bbox_list": [ [ 533.96, 187.61, 639.0, 346.47 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577343.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: red bus in background on right.", "normal_caption": "red bus in background on right", "solution": [ 533.96, 187.61, 640.0, 347.47 ], "normalized_solution": [ 834, 379, 1000, 703 ] }, { "height": 494, "width": 640, "id": 998, "original_id": 163229, "dataset_name": "refcoco", "area": 122402.49605000002, "iscrowd": 0, "image_id": 998, "category_id": 6, "bbox_list": [ [ 174.75, 73.19, 532.21, 454.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577343.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: closest red bus.", "normal_caption": "closest red bus", "solution": [ 174.75, 73.19, 533.21, 455.17 ], "normalized_solution": [ 273, 148, 833, 921 ] }, { "height": 494, "width": 640, "id": 999, "original_id": 163229, "dataset_name": "refcoco", "area": 122402.49605000002, "iscrowd": 0, "image_id": 999, "category_id": 6, "bbox_list": [ [ 174.75, 73.19, 532.21, 454.17 ] ], "text_type": "caption", "image": "train2014/COCO_train2014_000000577343.jpg", "problem": "Please provide the bounding box coordinate of the region this sentence describes: the bus right in front.", "normal_caption": "the bus right in front", "solution": [ 174.75, 73.19, 533.21, 455.17 ], "normalized_solution": [ 273, 148, 833, 921 ] } ]